<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v13i1e80072</article-id><article-id pub-id-type="doi">10.2196/80072</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>An Intelligent Trial Eligibility Screening Tool Using Natural Language Processing With a Block-Based Visual Programming Interface: Development and Usability Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Hu</surname><given-names>Ya-Han</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Cheng</surname><given-names>Yi-Ying</given-names></name><degrees>MIM</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lan</surname><given-names>Chung-Ching</given-names></name><degrees>MBA</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Su</surname><given-names>Yu-Hsiang</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name name-style="western"><surname>Sung</surname><given-names>Sheng-Feng</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Information Management, National Central University</institution><addr-line>Taoyuan</addr-line><country>Taiwan</country></aff><aff id="aff2"><institution>Asian Institute for Impact Measurement and Management, National Central University</institution><addr-line>Taoyuan</addr-line><country>Taiwan</country></aff><aff id="aff3"><institution>Division of Neurology, Department of Internal Medicine, Ditmanson Medical Foundation Chia-Yi Christian Hospital</institution><addr-line>539 Zhongxiao Road, East District</addr-line><addr-line>Chiayi City</addr-line><country>Taiwan</country></aff><aff id="aff4"><institution>Department of Nursing, Fooyin University</institution><addr-line>Kaohsiung</addr-line><country>Taiwan</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Coristine</surname><given-names>Andrew</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Chrimes</surname><given-names>Dillon</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Sharma</surname><given-names>Priyanshu</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Sheng-Feng Sung, MD, PhD, Division of Neurology, Department of Internal Medicine, Ditmanson Medical Foundation Chia-Yi Christian Hospital, 539 Zhongxiao Road, East District, Chiayi City, 60002, Taiwan, +886-5-2765041 ext 8655; <email>richard.sfsung@gmail.com</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>11</day><month>12</month><year>2025</year></pub-date><volume>13</volume><elocation-id>e80072</elocation-id><history><date date-type="received"><day>04</day><month>07</month><year>2025</year></date><date date-type="rev-recd"><day>27</day><month>11</month><year>2025</year></date><date date-type="accepted"><day>27</day><month>11</month><year>2025</year></date></history><copyright-statement>&#x00A9; Ya-Han Hu, Yi-Ying Cheng, Chung-Ching Lan, Yu-Hsiang Su, Sheng-Feng Sung. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 11.12.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2025/1/e80072"/><abstract><sec><title>Background</title><p>Clinical trial eligibility screening using electronic medical records (EMRs) is challenging due to the complexity of patient data and the varied clinical terminologies. Manual screening is time-consuming, requires specialized knowledge, and can lead to inconsistent participant selection, potentially compromising patient safety and research outcomes. This is critical in time-sensitive conditions like acute ischemic stroke. While computerized clinical decision support tools offer solutions, most require software engineering expertise to update, limiting their practical utility when eligibility criteria change.</p></sec><sec><title>Objective</title><p>We developed and evaluated the intelligent trial eligibility screening tool (iTEST), which combines natural language processing with a block-based visual programming interface designed to enable clinicians to create and modify eligibility screening rules independently. In this study, we assessed iTEST&#x2019;s rule evaluation module using pre-configured rules and compared its effectiveness with that of standard EMR interfaces.</p></sec><sec sec-type="methods"><title>Methods</title><p>We conducted an experiment at a tertiary teaching hospital in Taiwan with 12 clinicians using a 2-period crossover design. The clinicians assessed the eligibility of 4 patients with stroke for 2 clinical trials using both standard EMR and iTEST in a counterbalanced order, resulting in 48 evaluation scenarios. The iTEST comprised a rule authoring module using Google Blockly and a rule evaluation module utilizing MetaMap Lite for extracting medical concepts from unstructured EMR documents and structured laboratory data. Primary outcomes included accuracy in determining eligibility. Secondary outcomes measured task completion time, cognitive workload using the National Aeronautics and Space Administration Task Load Index scale (range 0&#x2010;100, with lower scores indicating a lower cognitive workload), and system usability through the system usability scale (range: 0&#x2010;100, with higher scores indicating higher system usability).</p></sec><sec sec-type="results"><title>Results</title><p>The iTEST significantly improved accuracy scores (from 0.91 to 1.00, <italic>P</italic>&#x003C;.001) and reduced completion time (from 3.18 to 2.44 min, <italic>P</italic>=.004) compared to the standard EMR interface. Users reported lower cognitive workload (National Aeronautics and Space Administration Task Load Index scale, 39.7 vs 62.8, <italic>P</italic>=.02) and higher system usability scale scores (71.3 vs 46.3, <italic>P</italic>=.01) with the iTEST. Particularly notable improvements in perceived cognitive workload were observed in temporal demand, effort, and frustration levels.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>The iTEST demonstrated superior performance in clinical trial eligibility screening, delivering improved accuracy, reduced completion time, lower cognitive workload, and better usability when evaluating preconfigured eligibility rules. The improved accuracy is critical for patient safety, as the misidentification of eligibility criteria could expose patients to inappropriate treatments or exclude them from beneficial trials. The adaptability and ability of the iTEST to process both structured and unstructured data make it valuable for time-sensitive scenarios and evolving research protocols. Future research should evaluate clinicians&#x2019; ability to create and modify eligibility rules using the block-based authoring interface, as well as assess the iTEST across diverse types of clinical trials and health care settings.</p></sec></abstract><kwd-group><kwd>block-based visual programming</kwd><kwd>clinical decision support</kwd><kwd>clinical trials</kwd><kwd>electronic medical records</kwd><kwd>eligibility screening</kwd><kwd>natural language processing</kwd><kwd>patient safety</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Clinical trials follow strict criteria for participant selection, using documented medical records as essential information sources. Over time, electronic medical records (EMRs) have evolved into comprehensive data repositories, enabling health care providers to track information systematically [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. However, the increased volume and complexity of EMRs offer a detailed view of patient histories while posing challenges for researchers analyzing this wealth of data.</p><p>The complexity of EMRs demands extensive time and effort from researchers to analyze documents. Addressing EMR-related cognitive overload and burnout is now critical [<xref ref-type="bibr" rid="ref4">4</xref>]. Researchers face tight deadlines, especially in clinical trials for time-sensitive conditions like stroke or brain injury. The phrase &#x201C;time is brain&#x201D; underscores the urgency for immediate therapy post-onset [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. Therefore, researchers must rapidly verify inclusion and exclusion criteria [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. Accurately extracting relevant information from EMRs is also essential for participant eligibility; violations could compromise trial validity and harm participants. This heavy workload increases mental stress and risks judgment errors among clinical researchers.</p><p>To address these challenges, using computerized clinical decision support tools in trial eligibility screening offers a promising solution [<xref ref-type="bibr" rid="ref9">9</xref>]. These systems can efficiently process EMRs, enabling rapid candidate screening. However, EMRs contain a significant amount of unstructured narrative text, with about 80% being narrative&#x2014;a format clinicians prefer for patient information [<xref ref-type="bibr" rid="ref10">10</xref>]. These unstructured data complicate medical concept extraction automation. The widespread use of synonyms, acronyms, and abbreviations in clinical documentation further complicates matters, making conventional natural language processing (NLP) techniques often inadequate and necessitating specialized medical NLP tools.</p><p>Our previous study developed an NLP-enhanced task-specific EMR interface that presented relevant medical concepts to clinicians through highlighted documents for determining intravenous thrombolysis eligibility criteria [<xref ref-type="bibr" rid="ref11">11</xref>]. The results showed that this EMR interface improved decision-making in stroke therapy. However, creating entirely new systems with specific rules for each clinical problem remains challenging. Clinical trial or therapy eligibility criteria often evolve as new evidence emerges [<xref ref-type="bibr" rid="ref12">12</xref>]. Current approaches require software engineers to update rules or build new systems whenever clinical guidelines or criteria change, raising costs [<xref ref-type="bibr" rid="ref13">13</xref>]. Therefore, there is considerable room for improving the design of such tools.</p><p>This study aimed to develop an intelligent trial eligibility screening tool (iTEST) adaptable to various medical scenarios, particularly where eligibility criteria frequently change. By identifying common patterns in eligibility criteria and using a block-based visual programming interface, our tool enables clinicians to create computerized eligibility rules independently, without requiring software engineering expertise. We conducted experiments to evaluate the tool&#x2019;s impact on users&#x2019; accuracy, efficiency, and cognitive workload during eligibility determination.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Setting</title><p>This study was conducted at Ditmanson Medical Foundation Chia-Yi Christian Hospital, a 1000-bed tertiary teaching hospital in southern Taiwan, which has a certified comprehensive stroke center managing approximately 650 stroke admissions annually. We evaluated 2 sets of eligibility criteria: the first set for intravenous thrombolysis, adapted from the National Institute of Neurological Disorders and Stroke (NINDS) recombinant tissue-plasminogen activator (rt-PA) trial [<xref ref-type="bibr" rid="ref14">14</xref>], which examined the efficacy of tissue plasminogen activator for acute ischemic stroke, and the second set from the Librexia STROKE trial [<xref ref-type="bibr" rid="ref15">15</xref>], examining milvexian&#x2019;s safety and efficacy in preventing recurrent cerebrovascular events post-acute ischemic stroke or high-risk transient ischemic attack.</p></sec><sec id="s2-2"><title>Ethical Considerations</title><p>The study protocol received formal approval from the Institutional Review Board of Ditmanson Medical Foundation Chia-Yi Christian Hospital (2022102). A unique study identification number replaced patient identifiers to ensure confidentiality. Informed consent was thus exempted. Participants were compensated NTD 3000 (&#x2248;USD 96) for their time and participation.</p></sec><sec id="s2-3"><title>Intelligent Trial Eligibility Screening Tool</title><p><xref ref-type="fig" rid="figure1">Figure 1</xref> illustrates the overview of the iTEST, which has 2 main components: the rule authoring and evaluation modules. In the rule authoring module, users convert narrative eligibility criteria into Blockly blocks [<xref ref-type="bibr" rid="ref16">16</xref>], which are parsed into customized rule expressions and stored in the rule base. The rule evaluation module extracts structured laboratory data from EMRs and maps medical concepts from unstructured EMR documents using MetaMap Lite [<xref ref-type="bibr" rid="ref17">17</xref>]. The inference engine then determines eligibility for each criterion by matching the extracted information to the rule base, and the tool presents users with rule-matching results.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Overview of the intelligent trial eligibility screening tool (iTEST), which comprises a rule authoring module (upper part) and a rule evaluation module (lower part). EMR: electronic medical record.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e80072_fig01.png"/></fig><p>The rule authoring module (upper part of <xref ref-type="fig" rid="figure1">Figure 1</xref>) creates, edits, and versions the eligibility criteria checklist using a block-based visual programming interface powered by Blockly (version 10.4.3; Google) [<xref ref-type="bibr" rid="ref16">16</xref>]. This method, commonly used in programming education, provides visual cues and drag-and-drop functionality while avoiding invalid block combinations. Our study developed customized rule expressions that represent medical concepts and laboratory items in a machine-readable format. Users can easily convert human-written checklist criteria into rule expressions by creating criterion blocks. For numerical laboratory data, criterion blocks allow users to input laboratory items to define conditions (eg, &#x201C;Platelets &#x003C;100,000&#x201D;). For unstructured documents, criterion blocks enable users to specify multiple medical concepts and select EMR document types. Time conditions can be added by using temporal blocks that perform date calculations on EMR timestamp fields (<xref ref-type="fig" rid="figure2">Figure 2</xref>), while logical operators such as AND can combine blocks, which execute separate queries across EMR documents, to express complex criteria like &#x201C;Having a headache or head injury within three years&#x201D; or &#x201C;diabetes with prior stroke in the past.&#x201D; The module translates these blocks into machine-readable rule expressions, enhancing the readability of eligibility criteria and making it easier for nonprogrammers to understand. This module thus enables clinicians to develop complex eligibility rules without requiring programming skills.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>An example showing how Blockly blocks are converted into machine-readable rule expressions.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e80072_fig02.png"/></fig><p>The rule evaluation module (lower part of <xref ref-type="fig" rid="figure1">Figure 1</xref>) processes 2 data types. It reads numerical laboratory data in tabular format and uses MetaMap Lite (3.6.2rc8 binary only version; U.S. National Library of Medicine) to extract medical concepts from unstructured EMR documents. MetaMap Lite [<xref ref-type="bibr" rid="ref17">17</xref>], a faster version of MetaMap [<xref ref-type="bibr" rid="ref18">18</xref>], maps concepts using the Unified Medical Language System Metathesaurus and assigns Unified Medical Language System concept unique identifiers to annotated concepts [<xref ref-type="bibr" rid="ref17">17</xref>]. It generates a list of concepts from EMR documents, discarding irrelevant ones based on semantic type settings. Additionally, it addresses challenges like complex concepts with multiple synonyms and potential misinterpretation of word context variations.</p><p>As an internal validation, we evaluated MetaMap Lite&#x2019;s ability to identify medical concepts related to the eligibility criteria examined in this study. We randomly selected 61 documents from 20 patients in a validation dataset separate from the one used for rule development. Two independent expert clinicians manually reviewed and annotated each document to establish a gold-standard reference, resolving disagreements through discussion and consensus. Precision and recall were calculated by comparing MetaMap Lite&#x2019;s automated extractions with the gold-standard annotations for each eligibility concept. Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> displays the results, showing high precision and recall for most of the related concepts.</p><p>The inference engine analyzes the extracted information against the rule base to evaluate eligibility for each criterion. A web-based interface displays the rule-matching results, allowing users to review the eligibility criteria checklist with links to annotated EMR documents, highlighting key concepts for review (<xref ref-type="fig" rid="figure3">Figure 3</xref>).</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>The intelligent trial eligibility screening tool (iTEST) interface. The left panel displays a trial eligibility criteria checklist, with each criterion marked yes or no based on the patient&#x2019;s data. The upper right panel features 2 tabs: one for clinical documents and one for numerical laboratory data. A red dot marks documents with relevant information. The lower right panel shows the content of the selected clinical document, highlighting key medical concepts for easy reference.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e80072_fig03.png"/></fig></sec><sec id="s2-4"><title>User Experiment</title><p>We conducted a user experiment to assess users&#x2019; accuracy, efficiency, and perceived workload in determining eligibility. A total of 12 clinicians participated in the study, using either a standard EMR interface or the iTEST on a desktop computer to complete eligibility criteria checklists for the NINDS rt-PA and Librexia STROKE trials. Participation was voluntary and compensated.</p><p>The experiment used a 2-period crossover design to compare the effectiveness of the iTEST with a standard EMR interface. Each user evaluated 4 patients&#x2014;2 with the iTEST and 2 with the standard EMR&#x2014;resulting in 48 scenarios (<xref ref-type="fig" rid="figure4">Figure 4A</xref>). We set the participant count at 12 to ensure each patient appeared 6 times in both testing scenarios.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>A 2-period crossover design for the user experiment (A). Procedures of the user experiment (B). EMR: electronic medical record; NASA-TLX: National Aeronautics and Space Administration Task Load Index; rt-PA: recombinant tissue-plasminogen activator; SUS: system usability scale.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e80072_fig04.png"/></fig><p>The 4 cases chosen for this study are actual patients with stroke from our hospital. They have complex histories, detailed records across multiple departments, and several treatment contraindications. Some critical contraindications are only documented in less prominent sections, like outpatient notes, making them harder to identify quickly during assessment. To prevent overfitting and ensure an unbiased evaluation, the 4 cases were held out from the datasets used for the development or internal validation of the eligibility extraction rules.</p><p>At the experiment&#x2019;s start, each user received a detailed introduction to procedures (<xref ref-type="fig" rid="figure4">Figure 4B</xref>) and 10 minutes of iTEST training. A study coordinator managed the process and recorded time points. In period 1, users utilized either the standard EMR interface or the iTEST, switching to the other in period 2. During each period, users evaluated eligibility for 2 patients, first for the rt-PA checklist and then for the milvexian checklist. After evaluations, they assessed cognitive workload using the National Aeronautics and Space Administration Task Load Index (NASA-TLX) scale [<xref ref-type="bibr" rid="ref19">19</xref>]. At the end of each period, they provided overall usability feedback through the system usability scale (SUS) questionnaire [<xref ref-type="bibr" rid="ref20">20</xref>].</p></sec><sec id="s2-5"><title>Outcomes</title><p>The primary outcome measured response accuracy to the eligibility checklist. For each patient, users completed checklists for 2 trials (Tables S2 and S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). At least 2 senior neurologists (YHS and SFS) with extensive stroke care experience established reference answers by consensus, against which user responses were marked as correct or incorrect. Each correct response earned 1 point, and the final accuracy score (maximum=1) for each checklist was the average of the points of all criteria in that checklist.</p><p>Secondary outcomes included checklist completion time, cognitive workload (measured by the NASA-TLX scale), and tool usability (measured by the SUS). The NASA-TLX assesses 2 dimensions of subjective workload: mental demand, physical demand, temporal demand, performance, effort, and frustration [<xref ref-type="bibr" rid="ref19">19</xref>], rated from 0 to 20, with higher scores indicating greater cognitive workload. Ratings are weighted to produce a total score from 0 to 100. The SUS evaluates interface usability via a 10-item Likert scale questionnaire (from strongly agree to strongly disagree), assessing factors including support needs, training requirements, complexity, integration, ease of learning, and user confidence [<xref ref-type="bibr" rid="ref20">20</xref>]. SUS scores range from 0 to 100, with higher scores indicating better usability. A prior study showed that adjective ratings of &#x201C;poor,&#x201D; &#x201C;OK,&#x201D; and &#x201C;good&#x201D; corresponded to average SUS scores of 35.7, 50.9, and 71.4, respectively [<xref ref-type="bibr" rid="ref21">21</xref>].</p><p>In addition to the above planned analyses comparing overall performance between the standard EMR interface and the iTEST, we conducted exploratory subgroup analyses examining each treatment protocol (rt-PA and milvexian) separately to provide more detailed insights into system performance across different clinical scenarios.</p></sec><sec id="s2-6"><title>Statistical Analysis</title><p>Given the small sample size in the user experiment and the non-normal distribution of the outcome measures, we reported the outcome measures as medians with interquartile ranges and conducted nonparametric analyses. The iTEST and the standard EMR interface were compared using the Wilcoxon signed-rank test for repeated user measurements. Two-tailed <italic>P</italic> values &#x003C;.05 were considered statistically significant. Analyses were performed using R version 4.4.0 (R Foundation for Statistical Computing).</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>User Statistics</title><p><xref ref-type="table" rid="table1">Table 1</xref> summarizes participant characteristics. The study included 6 physicians and 6 nurse practitioners. The participants, who were evenly split between male and female participants, had a mean age of 41 years and varied widely in experience levels across clinical practice, EMR use, personal computer use, and stroke care. The median clinical experience was 14.5 years, and they used the standard EMR interface for a median of 7 years.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>User characteristics.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" rowspan="2">User</td><td align="left" valign="bottom" rowspan="2">Age (y)</td><td align="left" valign="bottom" rowspan="2">Gender</td><td align="left" valign="bottom" rowspan="2">Profession</td><td align="left" valign="bottom" colspan="4">Experience (y)</td></tr><tr><td align="left" valign="bottom">Clinical practice</td><td align="left" valign="bottom">EMR<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> use</td><td align="left" valign="bottom">PC<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> use</td><td align="left" valign="bottom">Stroke care</td></tr></thead><tbody><tr><td align="left" valign="top">#1</td><td align="left" valign="top">34</td><td align="left" valign="top">Male</td><td align="left" valign="top">Physician</td><td align="left" valign="top">7</td><td align="left" valign="top">5</td><td align="left" valign="top">7</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top">#2</td><td align="left" valign="top">46</td><td align="left" valign="top">Female</td><td align="left" valign="top">NP<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">25</td><td align="left" valign="top">15</td><td align="left" valign="top">30</td><td align="left" valign="top">5</td></tr><tr><td align="left" valign="top">#3</td><td align="left" valign="top">51</td><td align="left" valign="top">Female</td><td align="left" valign="top">NP</td><td align="left" valign="top">27</td><td align="left" valign="top">9</td><td align="left" valign="top">30</td><td align="left" valign="top">16</td></tr><tr><td align="left" valign="top">#4</td><td align="left" valign="top">39</td><td align="left" valign="top">Female</td><td align="left" valign="top">NP</td><td align="left" valign="top">10</td><td align="left" valign="top">10</td><td align="left" valign="top">20</td><td align="left" valign="top">16</td></tr><tr><td align="left" valign="top">#5</td><td align="left" valign="top">40</td><td align="left" valign="top">Female</td><td align="left" valign="top">NP</td><td align="left" valign="top">20</td><td align="left" valign="top">8</td><td align="left" valign="top">20</td><td align="left" valign="top">3</td></tr><tr><td align="left" valign="top">#6</td><td align="left" valign="top">32</td><td align="left" valign="top">Male</td><td align="left" valign="top">Physician</td><td align="left" valign="top">8</td><td align="left" valign="top">7</td><td align="left" valign="top">15</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top">#7</td><td align="left" valign="top">40</td><td align="left" valign="top">Male</td><td align="left" valign="top">Physician</td><td align="left" valign="top">14</td><td align="left" valign="top">6</td><td align="left" valign="top">25</td><td align="left" valign="top">6</td></tr><tr><td align="left" valign="top">#8</td><td align="left" valign="top">35</td><td align="left" valign="top">Male</td><td align="left" valign="top">Physician</td><td align="left" valign="top">10</td><td align="left" valign="top">3</td><td align="left" valign="top">25</td><td align="left" valign="top">3</td></tr><tr><td align="left" valign="top">#9</td><td align="left" valign="top">41</td><td align="left" valign="top">Male</td><td align="left" valign="top">Physician</td><td align="left" valign="top">15</td><td align="left" valign="top">1</td><td align="left" valign="top">22</td><td align="left" valign="top">15</td></tr><tr><td align="left" valign="top">#10</td><td align="left" valign="top">43</td><td align="left" valign="top">Male</td><td align="left" valign="top">Physician</td><td align="left" valign="top">16</td><td align="left" valign="top">12</td><td align="left" valign="top">20</td><td align="left" valign="top">16</td></tr><tr><td align="left" valign="top">#11</td><td align="left" valign="top">40</td><td align="left" valign="top">Female</td><td align="left" valign="top">NP</td><td align="left" valign="top">18</td><td align="left" valign="top">7</td><td align="left" valign="top">22</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">#12</td><td align="left" valign="top">48</td><td align="left" valign="top">Female</td><td align="left" valign="top">NP</td><td align="left" valign="top">7</td><td align="left" valign="top">7</td><td align="left" valign="top">7</td><td align="left" valign="top">3</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>EMR: electronic medical record.</p></fn><fn id="table1fn2"><p><sup>b</sup>PC: personal computer.</p></fn><fn id="table1fn3"><p><sup>c</sup>NP: nurse practitioner.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Computational Performance</title><p>To evaluate the iTEST&#x2019;s computational performance, we measured processing time using EMRs from 15 patients with different documentation volumes. The number of clinical notes per patient ranged from 417 to 7299. System processing time (measured from patient selection to the full display of MetaMap Lite-analyzed clinical notes) varied from 6 to 345 seconds (average: 39 ms per note). This processing represents an initial computational overhead when a patient is first loaded; the subsequent evaluation of multiple eligibility criteria requires no extra processing time. In our clinical workflow, iTEST processing begins at patient triage in the emergency department, ensuring that all EMR analyses are completed before clinicians assess trial eligibility.</p></sec><sec id="s3-3"><title>Evaluation Outcomes</title><p><xref ref-type="table" rid="table2">Table 2</xref> compares the outcomes of the standard EMR interface with the iTEST. Users attained a median accuracy score of 0.91 for the primary outcome using the standard EMR interface. In contrast, the iTEST produced a higher median accuracy score of 1.00, representing a 9.9% improvement with strong statistical significance (<italic>P</italic>&#x003C;.001).</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Comparisons of outcomes between scenarios using the standard EMR<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> interface and the iTEST.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Outcome</td><td align="left" valign="bottom">Standard EMR interface, median (IQR)</td><td align="left" valign="bottom">iTEST<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup>, median (IQR)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Accuracy score</td><td align="left" valign="top">0.91 (0.84&#x2010;0.96)</td><td align="left" valign="top">1.00 (0.95&#x2010;1.00)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Time (min)</td><td align="left" valign="top">3.18 (2.34&#x2010;4.52)</td><td align="left" valign="top">2.44 (1.67&#x2010;3.17)</td><td align="left" valign="top">.004</td></tr><tr><td align="left" valign="top">NASA-TLX<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup> score</td><td align="left" valign="top">62.8 (36.7&#x2010;75.8)</td><td align="left" valign="top">39.7 (26.8&#x2010;52.0)</td><td align="left" valign="top">.02</td></tr><tr><td align="left" valign="top">SUS<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup> score</td><td align="left" valign="top">46.3 (36.9&#x2010;55.0)</td><td align="left" valign="top">71.3 (56.9&#x2010;75.6)</td><td align="left" valign="top">.01</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>EMR: electronic medical record.</p></fn><fn id="table2fn2"><p><sup>b</sup>iTEST: intelligent trial eligibility screening tool.</p></fn><fn id="table2fn3"><p><sup>c</sup>NASA-TLX: National Aeronautics and Space Administration Task Load Index.</p></fn><fn id="table2fn4"><p><sup>d</sup>SUS: system usability scale.</p></fn></table-wrap-foot></table-wrap><p>Tables S2 and S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> display the average accuracy scores of all 12 users for each eligibility criterion. With the standard EMR interface, accuracy scores ranged from 0.54 to 1.00, while the iTEST improved this range to 0.75 to 1.00. Users particularly struggled with certain criteria while using the standard interface, including identifying a diabetes history along with a prior stroke, internal bleeding within the last 3 months, and an activated prothrombin time of &#x2264;1.4 times the control value within 7 days. For these challenging criteria, accuracy scores dropped below 0.60 with the standard interface but improved to at least 0.75 with the iTEST.</p><p>For secondary outcomes, the iTEST reduced task completion time by 0.74 minutes (23.3% reduction; from 3.18 to 2.44 min; <italic>P</italic>=.004) compared with the standard EMR interface. Users reported a 23.1-point reduction in NASA-TLX scores (36.8% decrease; from 62.8 to 39.7; <italic>P</italic>=.02), indicating substantial improvement in perceived cognitive demand. The SUS scores improved by 25 points (54% increase; from 46.3 to 71.3; <italic>P</italic>=.01), moving the system from the &#x201C;POOR to OK&#x201D; category to the &#x201C;OK to GOOD&#x201D; category and exceeding the acceptability threshold [<xref ref-type="bibr" rid="ref21">21</xref>].</p><p><xref ref-type="table" rid="table3">Table 3</xref> presents the scores for each NASA-TLX subscale. Among the 6 dimensions of cognitive workload, mental demand, temporal demand, and effort received higher scores than physical demand, performance, and frustration. Participants reported significant reductions in temporal demand, effort, and frustration when using the iTEST as opposed to the standard EMR interface.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Comparisons of NASA-TLX<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> subscales between scenarios using the standard EMR<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> interface and the iTEST<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup>.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">NASA-TLX subscale</td><td align="left" valign="bottom">Standard EMR interface, median (IQR)</td><td align="left" valign="bottom">iTEST, median (IQR)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Mental demand</td><td align="left" valign="top">13.5 (10.0&#x2010;16.6)</td><td align="left" valign="top">10.0 (6.8&#x2010;14.3)</td><td align="left" valign="top">.13</td></tr><tr><td align="left" valign="top">Physical demand</td><td align="left" valign="top">10.0 (6.8&#x2010;13.0)</td><td align="left" valign="top">7.0 (4.4&#x2010;10.0)</td><td align="left" valign="top">.18</td></tr><tr><td align="left" valign="top">Temporal demand</td><td align="left" valign="top">14.0 (10.0&#x2010;17.6)</td><td align="left" valign="top">9.0 (4.9&#x2010;11.5)</td><td align="left" valign="top">.007</td></tr><tr><td align="left" valign="top">Performance</td><td align="left" valign="top">7.0 (2.0&#x2010;10.5)</td><td align="left" valign="top">3.8 (2.0&#x2010;5.3)</td><td align="left" valign="top">.10</td></tr><tr><td align="left" valign="top">Effort</td><td align="left" valign="top">14.0 (10.0&#x2010;17.6)</td><td align="left" valign="top">9.0 (4.4&#x2010;14.0)</td><td align="left" valign="top">.02</td></tr><tr><td align="left" valign="top">Frustration</td><td align="left" valign="top">7.5 (3.5&#x2010;10.0)</td><td align="left" valign="top">4.3 (1.0&#x2010;8.0)</td><td align="left" valign="top">.02</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>NASA-TLX: National Aeronautics and Space Administration Task Load Index.</p></fn><fn id="table3fn2"><p><sup>b</sup>EMR: electronic medical record.</p></fn><fn id="table3fn3"><p><sup>c</sup>iTEST: intelligent trial eligibility screening tool.</p></fn></table-wrap-foot></table-wrap><p>The results of the exploratory subgroup analysis, which compares the outcomes for each checklist individually, are listed in Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. For the rt-PA checklist, the accuracy score significantly improved from 0.91 to 1.00 (<italic>P</italic>=.001) using the iTEST. However, no significant differences were observed in task completion time or NASA-TLX scores. In contrast, the iTEST significantly improved all outcomes for the milvexian checklist.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Results</title><p>This study demonstrated that the iTEST outperformed the standard EMR interface in multiple ways. It improved the accuracy of determining trial eligibility criteria while enhancing efficiency through shorter task completion time. The iTEST also significantly reduced users&#x2019; cognitive workload and offered better usability than the standard interface.</p></sec><sec id="s4-2"><title>Accuracy of Eligibility Screening</title><p>The iTEST showed significant improvements over the standard EMR interface. It enhanced accuracy in identifying both numerical laboratory data and textual information in clinical documents. For instance, for the milvexian checklist, the accuracy score for &#x201C;APTT&#x2264;1.4 times control&#x201D; increased markedly from 0.54 to 0.92 (Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). This improvement likely occurred because the standard EMR lacks automated rule checking, requiring users to perform mental or manual calculations of numerical values.</p><p>The iTEST also improved accuracy when determining eligibility criteria using textual information. For instance, for the rt-PA checklist, users often misidentified patients with &#x201C;diabetes with prior stroke,&#x201D; achieving only a 0.54 accuracy score. This low score likely arose from the complexity of the assessments needing both laboratory data and clinical narratives. Extensive medical histories can obscure crucial diagnostic evidence, leading to medical errors [<xref ref-type="bibr" rid="ref22">22</xref>]. This is a common challenge for clinical researchers working with large, complex medical records&#x2014;even in electronic form, the human brain struggles to identify key concepts quickly [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. The iTEST addressed this challenge by extracting and highlighting essential information in clinical documents, thereby improving eligibility screening accuracy from 0.54 to 0.75 (Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). However, the suboptimal accuracy (0.75) underscores the challenge of linking temporal relationships between conditions documented across multiple clinical notes. This limitation affects both automated systems and human reviewers due to cognitive load and fragmented information in medical records.</p><p>While the iTEST performed well overall in clinical trial screening, our NLP validation (Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) revealed issues with key concept extraction. Notably, &#x201C;Anticoagulant&#x201D; detection (F<sub>1</sub>-score=0.33) was poor, mainly due to nonstandard negation expressions that caused false positives and incomplete concept mapping, leading to missing specific anticoagulants. We refined the process by adding 5 anticoagulants (warfarin, apixaban, dabigatran, edoxaban, rivaroxaban), greatly improving accuracy. This workaround, however, highlights a significant limitation of MetaMap Lite&#x2019;s concept generalization and ontology depth for broad drug classes; the tool failed to effectively handle a critical, broad safety concept without explicit enumeration of individual drugs. This highlights the need for concept validation and iterative refinement in NLP tools for critical criteria.</p><p>Furthermore, using MetaMap Lite instead of the full MetaMap may result in less effective concept extraction. While faster and lighter, MetaMap Lite implements only a subset of MetaMap&#x2019;s extensive options and lacks sophisticated word-sense disambiguation modules, which can result in mapping all available senses of a term and generating false positives [<xref ref-type="bibr" rid="ref17">17</xref>]. The failure to generalize the anticoagulant concept exemplifies this limitation. Specifically, MetaMap Lite&#x2019;s shallower ontology proved inadequate for managing hierarchical drug class relationships essential for safety screening. Although suitable for resource-limited or real-time applications, high-accuracy tasks are better served by the full MetaMap, emphasizing the trade-off between speed and depth.</p><p>Therefore, we recommend that clinical implementations of the iTEST include a validation phase where each new eligibility criterion is tested against a small set of annotated medical records before deployment. This quality assurance step can identify concept-mapping issues and help refine the process, especially for critical safety&#x2212;related criteria such as anticoagulant use. Furthermore, despite the iTEST achieving a median accuracy of 1.00, the relatively lower accuracy on critical, complex criteria such as &#x201C;diabetes with prior stroke&#x201D; still indicates a high-risk failure mode that the iTEST did not fully address.</p></sec><sec id="s4-3"><title>Efficiency and Usability</title><p>Even though users were trying the iTEST for the first time, they completed eligibility screening significantly faster after just a 10-minute training session. Users took a median of 2.44 minutes with the iTEST compared to 3.18 minutes with the standard EMR interface (<xref ref-type="table" rid="table2">Table 2</xref>) despite having years of experience with the latter. Notably, when analyzing individual checklists, the rt-PA checklist showed no significant improvement in completion time. This likely occurred because users were already highly familiar with checking eligibility criteria for intravenous thrombolysis (similar to those of the NINDS rt-PA trial) in their daily clinical practice before the study. Additionally, our study might have been underpowered to detect these smaller effects on familiar tasks, unlike the significant improvements seen across all metrics for the unfamiliar milvexian checklist.</p><p>With users achieving higher accuracy in less time during eligibility screening, it is unsurprising that the iTEST demonstrated better system usability than the standard EMR interface. The SUS score of 71.3 represents acceptable usability in the &#x201C;OK to GOOD&#x201D; range, indicating meaningful improvement over the standard EMR (46.3) but also suggesting room for further optimization. Despite being new to users and having received only 10 minutes of training, the iTEST demonstrated reasonable ease of use for this specific task. Research has shown that EMR systems should incorporate ongoing physician feedback to enhance usability, as poor EMR design can negatively impact physicians&#x2019; well-being and increase their perceived workload [<xref ref-type="bibr" rid="ref25">25</xref>]. Consistent with these findings, the iTEST not only improved system usability but also reduced the perceived cognitive workload.</p></sec><sec id="s4-4"><title>Cognitive Workload</title><p>The iTEST significantly outperformed the standard EMR interface in overall NASA-TLX scores. While some researchers question the mathematical validity of combining the 6 NASA-TLX dimensions into a single workload score [<xref ref-type="bibr" rid="ref26">26</xref>], we analyzed both the overall and individual dimensions (<xref ref-type="table" rid="table3">Table 3</xref>). The most substantial improvements were observed in temporal demand (from 14.0 to 9.0, <italic>P</italic>=.007) and effort (from 14.0 to 9.0, <italic>P</italic>=.02), with frustration levels also showing a significant reduction (from 7.5 to 4.3, <italic>P</italic>=.02). The marked reduction in temporal demand aligned with the decreased task completion time, which is crucial since the effectiveness of stroke therapy depends heavily on timing [<xref ref-type="bibr" rid="ref27">27</xref>] and creates substantial pressure for clinicians [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. While we observed significant improvements in temporal demand, effort, and frustration subscales, reductions in mental demand, physical demand, and performance subscales did not reach statistical significance, possibly due to a limited sample size.</p><p>Few studies have assessed trial eligibility screening workload [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>], primarily measuring work volume instead of cognitive burden. To our knowledge, no research has specifically analyzed the cognitive workload of this task. However, studies have compared perceived cognitive workload across different EMR interfaces and visualization tools for various clinical tasks [<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref34">34</xref>], indicating that renovations to the EMR interface can enhance efficiency and reduce cognitive demands.</p></sec><sec id="s4-5"><title>Clinical Implications</title><p>The iTEST improves upon the standard EMR interface with better accuracy and efficiency in eligibility screening, reduced cognitive workload, and enhanced usability, leading to several clinical benefits. Researchers can enroll suitable trial participants more effectively, ensuring scientific validity and data quality while protecting ineligible patients. Additionally, the iTEST enhances patient safety by avoiding unnecessary risks. For instance, the NINDS-rt-PA trial, which examined rt-PA in patients with acute ischemic stroke, highlights the importance of careful patient selection to mitigate serious intracranial bleeding risks [<xref ref-type="bibr" rid="ref35">35</xref>]. The eligibility criteria established by this trial have become the standard for intravenous thrombolysis [<xref ref-type="bibr" rid="ref36">36</xref>]. Consequently, the iTEST can assist clinicians in selecting appropriate patients for therapies, improving routine clinical practice.</p><p>While the iTEST&#x2019;s computational overhead can reach up to 345 seconds for patients with extensive EMR histories, this does not affect time-sensitive clinical decision-making in our workflow. By starting EMR processing at emergency department triage, all computational work is completed before clinicians evaluate trial eligibility. This integration ensures that the iTEST&#x2019;s processing time does not cause delays during the critical acute stroke assessment window. Future implementations in other clinical settings should consider similar workflow integration strategies, and improving MetaMap Lite&#x2019;s performance may further reduce processing times for real-time use.</p><p>This study examined 2 checklists. Users were already familiar with the rt-PA checklist before the study. They still made occasional mistakes, achieving a median accuracy score of 0.91. The iTEST improved this score to 1.00. The milvexian checklist, being new to users, yielded a lower median accuracy score (0.84) than the rt-PA checklist (0.91), highlighting how unfamiliarity with eligibility criteria can lead to more errors. With the iTEST, users achieved nearly perfect accuracy (median score 1.00) for both the familiar rt-PA and unfamiliar milvexian checklist, demonstrating its value over the standard EMR interface, especially for new eligibility checklists. However, the separate analyses of the rt-PA and milvexian checklists were exploratory. While these findings provide valuable insights into protocol-specific performance, they should be interpreted cautiously and confirmed in future prospective studies with predefined hypotheses.</p><p>Cognitive overload is a leading cause of burnout among clinicians [<xref ref-type="bibr" rid="ref4">4</xref>]. When facing burnout, clinicians favor patients with straightforward medical histories, as fewer clinical documents are needed for eligibility determination. They may overlook patients with complex, lengthy medical histories requiring thorough review. This selection bias can compromise clinical trial validity by causing the trial population to deviate from the intended target population. The iTEST addresses this issue by reducing cognitive workload, thus streamlining patient recruitment and minimizing selection bias. This benefit becomes even more pronounced as EMR documentation grows over time.</p><p>Prior research on trial eligibility screening has primarily focused on enhancing recruitment efficiency through the application of NLP and machine learning to EMR data. The foundational work by Ni et al [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>] demonstrated substantial workload reductions, with over 90% in pediatric emergency department settings and 85% in pediatric oncology, by leveraging both structured data and unstructured clinical notes. The subsequent development of the Automated Clinical Trial Eligibility Screener [<xref ref-type="bibr" rid="ref9">9</xref>] advanced this work into real-time, prospective screening, achieving a 34% reduction in screening time and an SUS score of 80.0.</p><p>The iTEST extends this foundation by addressing clinician empowerment and cognitive burden through 2 key innovations. First, its block-based visual programming interface enables clinicians to independently author and update screening rules without software engineering support, enhancing adaptability to evolving eligibility criteria. Second, the iTEST demonstrated significant improvements not only in efficiency but also in accuracy and cognitive workload, quantitatively validating its ability to reduce mental burden while maintaining acceptable usability. This positions the iTEST as a clinician-centric solution that enhances both the efficiency and reliability of eligibility screening while reducing clinician burnout.</p></sec><sec id="s4-6"><title>Future Direction</title><p>Clinical notes at our hospital are primarily in English, with very few in Chinese. Therefore, we disregarded the Chinese portions when developing the iTEST. Besides, extracting medical concepts from non-English clinical documents presents significant challenges [<xref ref-type="bibr" rid="ref37">37</xref>]. However, advancements in large language models (LLMs) may help address the challenge of multilingual clinical notes. They could potentially process multilingual clinical notes without explicit translation, reducing information loss. Moreover, LLMs provide promising capabilities that could overcome several limitations of rule-based approaches, such as those used in our study. Their natural language understanding could improve the handling of variations in clinical documentation, context-dependent interpretations, and complex eligibility criteria that require reasoning across multiple data points.</p><p>However, several issues must be addressed before widespread clinical use. First, reliability and consistency remain major challenges [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>]. LLMs can produce inconsistent outputs for the same inputs and may generate plausible but incorrect information (&#x201C;hallucinations&#x201D;), which is unacceptable in clinical decisions. Second, computing costs and infrastructure requirements could limit scalability compared to rule-based systems. Third, regulatory compliance presents significant obstacles, as current frameworks require explainable, auditable decision-making processes, but LLM reasoning often lacks transparency. Finally, concerns about data privacy and the need for specialized medical training data require careful consideration [<xref ref-type="bibr" rid="ref40">40</xref>].</p><p>Future hybrid approaches that combine rule-based reliability with LLM flexibility may offer the best solutions [<xref ref-type="bibr" rid="ref41">41</xref>], where LLMs handle complex language understanding and concept extraction [<xref ref-type="bibr" rid="ref42">42</xref>]. Conversely, rule-based systems guarantee consistent application of explicit eligibility criteria. Importantly, such hybrid frameworks can improve explainability by maintaining transparent decision pathways: the rule-based component offers clear, traceable logic for eligibility determinations, while LLM outputs can be limited to produce interpretable explanations for their reasoning processes. In this way, LLMs, with their strong reasoning and summarization abilities, could be useful in various clinical and research scenarios [<xref ref-type="bibr" rid="ref43">43</xref>].</p></sec><sec id="s4-7"><title>Limitations</title><p>This study has several limitations. First, with only 12 clinicians evaluating 4 patients&#x2019; eligibility, the study findings may not reflect real-world scenarios. Furthermore, the small number of participants may lack enough statistical power to detect differences between the groups. Although our study design, with 12 clinicians, was appropriate for identifying medium-to-large differences, we acknowledge that it may have been underpowered to detect smaller, yet potentially clinically important, effects. Despite this limitation, all 4 outcomes achieved statistical significance. Second, the 4 patients chosen for this study may not accurately represent a typical patient population. However, these cases truly demonstrate the difficulties clinicians encounter when trying to retrieve crucial information from traditional EMR systems. In real-world clinical settings, these patients represent a specific group that not only risks misjudgment and possible harm but also presents challenges for clinical trials.</p><p>Third, while our crossover design enhances internal validity through within-subject comparisons, its applicability to real-world recruitment is limited due to the small number of participants and patient scenarios. These may not accurately reflect the diversity of clinical experience, patient complexity, practice patterns, or technological skills across different settings. Real-world implementation involves a wider range of patient presentations, comorbidities, and situations that could impact system performance differently. Future research should test the iTEST in diverse clinical environments with larger samples to better determine its effectiveness for large-scale trial recruitment. Fourth, the controlled experimental setting may not fully capture the time pressures, interruptions, and multitasking demands of actual emergency care that could influence accuracy and efficiency.</p><p>Fifth, the brief 10-minute training and the crossover design could theoretically lead to learning effects [<xref ref-type="bibr" rid="ref44">44</xref>] that may influence our results. Although we counterbalanced the task order to minimize these effects, the crossover design means participants&#x2019; second interface evaluation might have been affected by familiarity with the eligibility screening task itself. However, the counterbalancing of task order should have evenly distributed any such learning effects across conditions [<xref ref-type="bibr" rid="ref45">45</xref>]. Additionally, the short 10-minute training period for the iTEST actually serves as a conservative test of the system&#x2019;s usability. The fact that the iTEST showed superiority despite minimal training strengthens rather than weakens our findings.</p><p>Sixth, we acknowledge that our user study focused exclusively on the rule evaluation module and did not assess clinicians&#x2019; ability to author rules using the block-based interface. Our study design prioritized evaluating whether the system could effectively support the eligibility screening workflow with preconfigured rules, as this represents the most common use case in our target clinical settings. However, we recognize that this does not validate the authoring capabilities.</p><p>Finally, while participants had extensive experience with the standard EMR interface compared to minimal training with the iTEST, we cannot rule out the influence of the novelty effect [<xref ref-type="bibr" rid="ref46">46</xref>] or the Hawthorne [<xref ref-type="bibr" rid="ref47">47</xref>] effect on our results. Participants&#x2019; awareness of being observed and evaluated, along with the novelty of the iTEST interface, may have led to increased attention and improved performance. Future studies with longer training periods, repeated testing, and naturalistic observation could help determine whether the observed benefits persist beyond initial exposure, revealing learning curves for both systems.</p></sec><sec id="s4-8"><title>Conclusions</title><p>In this study, we introduced the iTEST, an innovative NLP-powered clinical decision support tool that uses MetaMap Lite to extract relevant concepts from EMRs. The system design includes a block-based visual programming interface intended to enable clinicians to author and modify eligibility rules independently; however, the usability and effectiveness of this authoring capability were not evaluated in this study and remain objectives for future research. Our user evaluation focused exclusively on the rule evaluation module using preconfigured rules, where the iTEST demonstrated superior accuracy and usability compared to the standard EMR interface, while reducing both task completion time and perceived cognitive workload. The tool&#x2019;s applications can extend beyond clinical trial screening to include the verification of indications and contraindications for specific therapies or interventions. Through these capabilities, the iTEST has the potential to enhance patient safety while easing clinicians&#x2019; cognitive burden. Future research should evaluate clinicians&#x2019; ability to create and modify eligibility rules using the block-based authoring interface to fully validate the system&#x2019;s empowerment objectives and finalize the assessment of the iTEST&#x2019;s intended functionality.</p></sec></sec></body><back><ack><p>The authors thank the Department of Information Technology at Ditmanson Medical Foundation Chia-Yi Christian Hospital for their technical support, which was invaluable in completing this study. During the preparation of this work, the authors used Grammarly to enhance clarity and ensure grammatical accuracy. After using this tool, the authors reviewed and edited the content as needed and took the full responsibility for the content of the published study.</p></ack><notes><sec><title>Funding</title><p>This research was supported in part by the National Science and Technology Council (grant numbers NSTC 113&#x2010;2410-H-008-054, NSTC 112&#x2010;2221-E-705&#x2010;001-MY2, and NSTC 114&#x2010;2221-E-705&#x2010;001-MY2) and the Ditmanson Medical Foundation Chia-Yi Christian Hospital (grant number I112-203).</p></sec><sec><title>Data Availability</title><p>Data and materials for this research are available from the corresponding author upon reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: SFS, YHH, YHS.</p><p>Data curation: CCL, SFS, YHS.</p><p>Formal analysis: CCL, SFS, YHH.</p><p>Supervision: SFS, YHS.</p><p>Writing &#x2013; original draft: CCL, YHH, YYC.</p><p>Writing &#x2013; review &#x0026; editing: CCL, SFS, YHH, YHS, YYC.</p><p>All authors have full access to the data in the study and take responsibility for the integrity and accuracy of the data analysis. YHS (06500@cych.org.tw) and SFS (sfsung@cych.org.tw) are co-corresponding authors for this article.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">iTEST</term><def><p>intelligent trial eligibility screening tool</p></def></def-item><def-item><term id="abb2">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb3">NASA-TLX</term><def><p>National Aeronautics and Space Administration Task Load Index</p></def></def-item><def-item><term id="abb4">NINDS</term><def><p>National Institute of Neurological Disorders and Stroke</p></def></def-item><def-item><term id="abb5">EMR</term><def><p> electronic medical record</p></def></def-item><def-item><term id="abb6">NLP</term><def><p> natural language processing</p></def></def-item><def-item><term id="abb7">rt-PA</term><def><p>recombinant tissue-plasminogen activator</p></def></def-item><def-item><term id="abb8">SUS</term><def><p> system usability scale</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lin</surname><given-names>HL</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>CA</given-names> </name></person-group><article-title>Association between electronic medical records and healthcare quality</article-title><source>Medicine (Baltimore)</source><year>2020</year><month>07</month><day>31</day><volume>99</volume><issue>31</issue><fpage>e21182</fpage><pub-id pub-id-type="doi">10.1097/MD.0000000000021182</pub-id><pub-id pub-id-type="medline">32756096</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mollart</surname><given-names>L</given-names> </name><name name-style="western"><surname>Newell</surname><given-names>R</given-names> </name><name name-style="western"><surname>Geale</surname><given-names>SK</given-names> </name><name name-style="western"><surname>Noble</surname><given-names>D</given-names> </name><name name-style="western"><surname>Norton</surname><given-names>C</given-names> </name><name name-style="western"><surname>O&#x2019;Brien</surname><given-names>AP</given-names> </name></person-group><article-title>Introduction of patient electronic medical records (EMR) into undergraduate nursing education: an integrated literature review</article-title><source>Nurse Educ Today</source><year>2020</year><month>11</month><volume>94</volume><fpage>104517</fpage><pub-id pub-id-type="doi">10.1016/j.nedt.2020.104517</pub-id><pub-id pub-id-type="medline">32853983</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>R</given-names> </name><name name-style="western"><surname>Niu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Scott</surname><given-names>SR</given-names> </name><etal/></person-group><article-title>Using electronic medical record data for research in a healthcare information and management systems society (HIMSS) analytics electronic medical record adoption model (EMRAM) stage 7 hospital in Beijing: cross-sectional study</article-title><source>JMIR Med Inform</source><year>2021</year><month>08</month><day>3</day><volume>9</volume><issue>8</issue><fpage>e24405</fpage><pub-id pub-id-type="doi">10.2196/24405</pub-id><pub-id pub-id-type="medline">34342589</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Asgari</surname><given-names>E</given-names> </name><name name-style="western"><surname>Kaur</surname><given-names>J</given-names> </name><name name-style="western"><surname>Nuredini</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Impact of electronic health record use on cognitive load and burnout among clinicians: narrative review</article-title><source>JMIR Med Inform</source><year>2024</year><month>04</month><day>12</day><volume>12</volume><fpage>e55499</fpage><pub-id pub-id-type="doi">10.2196/55499</pub-id><pub-id pub-id-type="medline">38607672</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fraser</surname><given-names>JF</given-names> </name><name name-style="western"><surname>H&#x00E4;rtl</surname><given-names>R</given-names> </name></person-group><article-title>Even in trauma, time is brain</article-title><source>Crit Care Med</source><year>2008</year><month>10</month><volume>36</volume><issue>10</issue><fpage>2951</fpage><lpage>2952</lpage><pub-id pub-id-type="doi">10.1097/CCM.0b013e31818724f2</pub-id><pub-id pub-id-type="medline">18812808</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mullen</surname><given-names>MT</given-names> </name><name name-style="western"><surname>Chaturvedi</surname><given-names>S</given-names> </name></person-group><article-title>Endovascular thrombectomy</article-title><source>Neurology (ECronicon)</source><year>2017</year><month>05</month><day>30</day><volume>88</volume><issue>22</issue><fpage>2074</fpage><lpage>2075</lpage><pub-id pub-id-type="doi">10.1212/WNL.0000000000003993</pub-id><pub-id pub-id-type="medline">28455385</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Parsons</surname><given-names>M</given-names> </name><name name-style="western"><surname>Spratt</surname><given-names>N</given-names> </name><name name-style="western"><surname>Bivard</surname><given-names>A</given-names> </name><etal/></person-group><article-title>A randomized trial of tenecteplase versus alteplase for acute ischemic stroke</article-title><source>N Engl J Med</source><year>2012</year><month>03</month><day>22</day><volume>366</volume><issue>12</issue><fpage>1099</fpage><lpage>1107</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa1109842</pub-id><pub-id pub-id-type="medline">22435369</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Skolnick</surname><given-names>BE</given-names> </name><name name-style="western"><surname>Maas</surname><given-names>AI</given-names> </name><name name-style="western"><surname>Narayan</surname><given-names>RK</given-names> </name><etal/></person-group><article-title>A clinical trial of progesterone for severe traumatic brain injury</article-title><source>N Engl J Med</source><year>2014</year><month>12</month><day>25</day><volume>371</volume><issue>26</issue><fpage>2467</fpage><lpage>2476</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa1411090</pub-id><pub-id pub-id-type="medline">25493978</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ni</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Bermudez</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kennebeck</surname><given-names>S</given-names> </name><name name-style="western"><surname>Liddy-Hicks</surname><given-names>S</given-names> </name><name name-style="western"><surname>Dexheimer</surname><given-names>J</given-names> </name></person-group><article-title>A real-time automated patient screening system for clinical trials eligibility in an emergency department: design and evaluation</article-title><source>JMIR Med Inform</source><year>2019</year><month>07</month><day>24</day><volume>7</volume><issue>3</issue><fpage>e14185</fpage><pub-id pub-id-type="doi">10.2196/14185</pub-id><pub-id pub-id-type="medline">31342909</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Murdoch</surname><given-names>TB</given-names> </name><name name-style="western"><surname>Detsky</surname><given-names>AS</given-names> </name></person-group><article-title>The inevitable application of big data to health care</article-title><source>JAMA</source><year>2013</year><month>04</month><day>3</day><volume>309</volume><issue>13</issue><fpage>1351</fpage><lpage>1352</lpage><pub-id pub-id-type="doi">10.1001/jama.2013.393</pub-id><pub-id pub-id-type="medline">23549579</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sung</surname><given-names>SF</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>K</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>DP</given-names> </name><name name-style="western"><surname>Hung</surname><given-names>LC</given-names> </name><name name-style="western"><surname>Su</surname><given-names>YH</given-names> </name><name name-style="western"><surname>Hu</surname><given-names>YH</given-names> </name></person-group><article-title>Applying natural language processing techniques to develop a task-specific EMR interface for timely stroke thrombolysis: a feasibility study</article-title><source>Int J Med Inform</source><year>2018</year><month>04</month><volume>112</volume><fpage>149</fpage><lpage>157</lpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2018.02.005</pub-id><pub-id pub-id-type="medline">29500013</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Su</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>G</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>J</given-names> </name></person-group><article-title>A review of research on eligibility criteria for clinical trials</article-title><source>Clin Exp Med</source><year>2023</year><month>10</month><volume>23</volume><issue>6</issue><fpage>1867</fpage><lpage>1879</lpage><pub-id pub-id-type="doi">10.1007/s10238-022-00975-1</pub-id><pub-id pub-id-type="medline">36602707</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sutton</surname><given-names>RT</given-names> </name><name name-style="western"><surname>Pincock</surname><given-names>D</given-names> </name><name name-style="western"><surname>Baumgart</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Sadowski</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Fedorak</surname><given-names>RN</given-names> </name><name name-style="western"><surname>Kroeker</surname><given-names>KI</given-names> </name></person-group><article-title>An overview of clinical decision support systems: benefits, risks, and strategies for success</article-title><source>NPJ Digit Med</source><year>2020</year><volume>3</volume><issue>1</issue><fpage>17</fpage><pub-id pub-id-type="doi">10.1038/s41746-020-0221-y</pub-id><pub-id pub-id-type="medline">32047862</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>National Institute of Neurological Disorders and Stroke rt-PA Stroke Study Group</collab></person-group><article-title>Tissue plasminogen activator for acute ischemic stroke</article-title><source>N Engl J Med</source><year>1995</year><month>12</month><day>14</day><volume>333</volume><issue>24</issue><fpage>1581</fpage><lpage>1587</lpage><pub-id pub-id-type="doi">10.1056/NEJM199512143332401</pub-id><pub-id pub-id-type="medline">7477192</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Birchansky</surname><given-names>J</given-names> </name><name name-style="western"><surname>Frishman</surname><given-names>WH</given-names> </name></person-group><article-title>Milvexian: a focus on a new oral anticoagulant that targets factor XIa for thromboembolism prophylaxis</article-title><source>Cardiol Rev</source><year>2025</year><volume>33</volume><issue>1</issue><fpage>93</fpage><lpage>97</lpage><pub-id pub-id-type="doi">10.1097/CRD.0000000000000588</pub-id><pub-id pub-id-type="medline">38305253</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Pasternak</surname><given-names>E</given-names> </name><name name-style="western"><surname>Fenichel</surname><given-names>R</given-names> </name><name name-style="western"><surname>Marshall</surname><given-names>AN</given-names> </name></person-group><article-title>Tips for creating a block language with Blockly</article-title><year>2017</year><conf-name>2017 IEEE Blocks and Beyond Workshop (B&#x0026;B)</conf-name><conf-date>Oct 9-10, 2017</conf-date><conf-loc>Raleigh, NC, USA</conf-loc><publisher-name>IEEE</publisher-name><fpage>21</fpage><lpage>24</lpage><pub-id pub-id-type="doi">10.1109/BLOCKS.2017.8120404</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Demner-Fushman</surname><given-names>D</given-names> </name><name name-style="western"><surname>Rogers</surname><given-names>WJ</given-names> </name><name name-style="western"><surname>Aronson</surname><given-names>AR</given-names> </name></person-group><article-title>MetaMap Lite: an evaluation of a new Java implementation of MetaMap</article-title><source>J Am Med Inform Assoc</source><year>2017</year><month>07</month><day>1</day><volume>24</volume><issue>4</issue><fpage>841</fpage><lpage>844</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocw177</pub-id><pub-id pub-id-type="medline">28130331</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Aronson</surname><given-names>AR</given-names> </name><name name-style="western"><surname>Lang</surname><given-names>FM</given-names> </name></person-group><article-title>An overview of MetaMap: historical perspective and recent advances</article-title><source>J Am Med Inform Assoc</source><year>2010</year><volume>17</volume><issue>3</issue><fpage>229</fpage><lpage>236</lpage><pub-id pub-id-type="doi">10.1136/jamia.2009.002733</pub-id><pub-id pub-id-type="medline">20442139</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hart</surname><given-names>SG</given-names> </name></person-group><article-title>NASA-Task load index (NASA-TLX); 20 years later</article-title><source>Proc Hum Factors Ergon Soc Annu Meet</source><year>2006</year><month>10</month><volume>50</volume><issue>9</issue><fpage>904</fpage><lpage>908</lpage><pub-id pub-id-type="doi">10.1177/154193120605000909</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Brooke</surname><given-names>J</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Jordan</surname><given-names>PW</given-names> </name><name name-style="western"><surname>Thomas</surname><given-names>B</given-names> </name><name name-style="western"><surname>McClelland</surname><given-names>IL</given-names> </name><name name-style="western"><surname>Weerdmeester</surname><given-names>B</given-names> </name></person-group><article-title>SUS&#x2014;a quick and dirty usability scale</article-title><source>Usability Evaluation in Industry</source><year>1996</year><access-date>2025-12-09</access-date><publisher-name>CRC Press</publisher-name><fpage>189</fpage><lpage>194</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://digital.ahrq.gov/sites/default/files/docs/survey/systemusabilityscale%2528sus%2529_comp%255B1%255D.pdf">https://digital.ahrq.gov/sites/default/files/docs/survey/systemusabilityscale%2528sus%2529_comp%255B1%255D.pdf</ext-link></comment><pub-id pub-id-type="other">0748404600</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bangor</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kortum</surname><given-names>P</given-names> </name><name name-style="western"><surname>Miller</surname><given-names>J</given-names> </name></person-group><article-title>Determining what individual SUS scores mean: adding an adjective rating scale</article-title><source>J Usability Stud</source><year>2009</year><month>05</month><day>1</day><access-date>2025-12-06</access-date><volume>4</volume><issue>3</issue><fpage>114</fpage><lpage>123</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://dl.acm.org/doi/10.5555/2835587.2835589">https://dl.acm.org/doi/10.5555/2835587.2835589</ext-link></comment></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nijor</surname><given-names>S</given-names> </name><name name-style="western"><surname>Rallis</surname><given-names>G</given-names> </name><name name-style="western"><surname>Lad</surname><given-names>N</given-names> </name><name name-style="western"><surname>Gokcen</surname><given-names>E</given-names> </name></person-group><article-title>Patient safety issues from information overload in electronic medical records</article-title><source>J Patient Saf</source><year>2022</year><month>09</month><day>1</day><volume>18</volume><issue>6</issue><fpage>e999</fpage><lpage>e1003</lpage><pub-id pub-id-type="doi">10.1097/PTS.0000000000001002</pub-id><pub-id pub-id-type="medline">35985047</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nolan</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Cartin-Ceba</surname><given-names>R</given-names> </name><name name-style="western"><surname>Moreno-Franco</surname><given-names>P</given-names> </name><name name-style="western"><surname>Pickering</surname><given-names>B</given-names> </name><name name-style="western"><surname>Herasevich</surname><given-names>V</given-names> </name></person-group><article-title>A multisite survey study of EMR review habits, information needs, and display preferences among medical ICU clinicians evaluating new patients</article-title><source>Appl Clin Inform</source><year>2017</year><month>10</month><volume>8</volume><issue>4</issue><fpage>1197</fpage><lpage>1207</lpage><pub-id pub-id-type="doi">10.4338/ACI-2017-04-RA-0060</pub-id><pub-id pub-id-type="medline">29272901</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Clynch</surname><given-names>N</given-names> </name><name name-style="western"><surname>Kellett</surname><given-names>J</given-names> </name></person-group><article-title>Medical documentation: part of the solution, or part of the problem? A narrative review of the literature on the time spent on and value of medical documentation</article-title><source>Int J Med Inform</source><year>2015</year><month>04</month><volume>84</volume><issue>4</issue><fpage>221</fpage><lpage>228</lpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2014.12.001</pub-id><pub-id pub-id-type="medline">25547194</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nguyen</surname><given-names>OT</given-names> </name><name name-style="western"><surname>Jenkins</surname><given-names>NJ</given-names> </name><name name-style="western"><surname>Khanna</surname><given-names>N</given-names> </name><etal/></person-group><article-title>A systematic review of contributing factors of and solutions to electronic health record-related impacts on physician well-being</article-title><source>J Am Med Inform Assoc</source><year>2021</year><month>04</month><day>23</day><volume>28</volume><issue>5</issue><fpage>974</fpage><lpage>984</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocaa339</pub-id><pub-id pub-id-type="medline">33517382</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bolton</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Biltekoff</surname><given-names>E</given-names> </name><name name-style="western"><surname>Humphrey</surname><given-names>L</given-names> </name></person-group><article-title>The mathematical meaninglessness of the NASA task load index: a level of measurement analysis</article-title><source>IEEE Trans Human-Mach Syst</source><year>2023</year><volume>53</volume><issue>3</issue><fpage>590</fpage><lpage>599</lpage><pub-id pub-id-type="doi">10.1109/THMS.2023.3263482</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Catanese</surname><given-names>L</given-names> </name><name name-style="western"><surname>Tarsia</surname><given-names>J</given-names> </name><name name-style="western"><surname>Fisher</surname><given-names>M</given-names> </name></person-group><article-title>Acute ischemic stroke therapy overview</article-title><source>Circ Res</source><year>2017</year><month>02</month><day>3</day><volume>120</volume><issue>3</issue><fpage>541</fpage><lpage>558</lpage><pub-id pub-id-type="doi">10.1161/CIRCRESAHA.116.309278</pub-id><pub-id pub-id-type="medline">28154103</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kenton</surname><given-names>EJ</given-names> </name><name name-style="western"><surname>Culebras</surname><given-names>A</given-names> </name><name name-style="western"><surname>Fayad</surname><given-names>PB</given-names> </name><etal/></person-group><article-title>Impact of stroke call on the stroke neurology workforce in the United States: possible challenges and opportunities</article-title><source>J Stroke Cerebrovasc Dis</source><year>2018</year><month>07</month><volume>27</volume><issue>7</issue><fpage>2019</fpage><lpage>2025</lpage><pub-id pub-id-type="doi">10.1016/j.jstrokecerebrovasdis.2018.02.063</pub-id><pub-id pub-id-type="medline">29625799</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>JV</given-names> </name><name name-style="western"><surname>Scott</surname><given-names>A</given-names> </name><name name-style="western"><surname>Osbun</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zipfel</surname><given-names>G</given-names> </name></person-group><article-title>Impact of stroke call on career satisfaction and burnout for academic neurointerventionalists: a grounded theory model</article-title><source>World Neurosurg</source><year>2021</year><month>07</month><volume>151</volume><fpage>e552</fpage><lpage>e564</lpage><pub-id pub-id-type="doi">10.1016/j.wneu.2021.04.091</pub-id><pub-id pub-id-type="medline">33933697</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ni</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Kennebeck</surname><given-names>S</given-names> </name><name name-style="western"><surname>Dexheimer</surname><given-names>JW</given-names> </name><etal/></person-group><article-title>Automated clinical trial eligibility prescreening: increasing the efficiency of patient identification for clinical trials in the emergency department</article-title><source>J Am Med Inform Assoc</source><year>2015</year><month>01</month><volume>22</volume><issue>1</issue><fpage>166</fpage><lpage>178</lpage><pub-id pub-id-type="doi">10.1136/amiajnl-2014-002887</pub-id><pub-id pub-id-type="medline">25030032</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ni</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wright</surname><given-names>J</given-names> </name><name name-style="western"><surname>Perentesis</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Increasing the efficiency of trial-patient matching: automated clinical trial eligibility pre-screening for pediatric oncology patients</article-title><source>BMC Med Inf Decis Making</source><year>2015</year><month>04</month><day>14</day><volume>15</volume><issue>1</issue><fpage>28</fpage><pub-id pub-id-type="doi">10.1186/s12911-015-0149-3</pub-id><pub-id pub-id-type="medline">25881112</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pollack</surname><given-names>AH</given-names> </name><name name-style="western"><surname>Pratt</surname><given-names>W</given-names> </name></person-group><article-title>Association of health record visualizations with physicians' cognitive load when prioritizing hospitalized patients</article-title><source>JAMA Netw Open</source><year>2020</year><month>01</month><day>3</day><volume>3</volume><issue>1</issue><fpage>e1919301</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2019.19301</pub-id><pub-id pub-id-type="medline">31940040</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Semanik</surname><given-names>MG</given-names> </name><name name-style="western"><surname>Kleinschmidt</surname><given-names>PC</given-names> </name><name name-style="western"><surname>Wright</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Impact of a problem-oriented view on clinical data retrieval</article-title><source>J Am Med Inform Assoc</source><year>2021</year><month>04</month><day>23</day><volume>28</volume><issue>5</issue><fpage>899</fpage><lpage>906</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocaa332</pub-id><pub-id pub-id-type="medline">33566093</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McGonagle</surname><given-names>EA</given-names> </name><name name-style="western"><surname>Karavite</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Grundmeier</surname><given-names>RW</given-names> </name><etal/></person-group><article-title>Evaluation of an antimicrobial stewardship decision support for pediatric infections</article-title><source>Appl Clin Inform</source><year>2023</year><month>01</month><volume>14</volume><issue>1</issue><fpage>108</fpage><lpage>118</lpage><pub-id pub-id-type="doi">10.1055/s-0042-1760082</pub-id><pub-id pub-id-type="medline">36754066</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Charbonnier</surname><given-names>G</given-names> </name><name name-style="western"><surname>Bonnet</surname><given-names>L</given-names> </name><name name-style="western"><surname>Biondi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Moulin</surname><given-names>T</given-names> </name></person-group><article-title>Intracranial bleeding after reperfusion therapy in acute ischemic stroke</article-title><source>Front Neurol</source><year>2021</year><volume>11</volume><fpage>629920</fpage><pub-id pub-id-type="doi">10.3389/fneur.2020.629920</pub-id><pub-id pub-id-type="medline">33633661</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Campbell</surname><given-names>BCV</given-names> </name><name name-style="western"><surname>Meretoja</surname><given-names>A</given-names> </name><name name-style="western"><surname>Donnan</surname><given-names>GA</given-names> </name><name name-style="western"><surname>Davis</surname><given-names>SM</given-names> </name></person-group><article-title>Twenty-year history of the evolution of stroke thrombolysis with intravenous alteplase to reduce long-term disability</article-title><source>Stroke</source><year>2015</year><month>08</month><volume>46</volume><issue>8</issue><fpage>2341</fpage><lpage>2346</lpage><pub-id pub-id-type="doi">10.1161/STROKEAHA.114.007564</pub-id><pub-id pub-id-type="medline">26152294</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Lin</surname><given-names>YC</given-names> </name><name name-style="western"><surname>Christen</surname><given-names>V</given-names> </name><name name-style="western"><surname>Gro&#x00DF;</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Evaluating cross-lingual semantic annotation for medical forms</article-title><year>2020</year><conf-name>13th International Conference on Health Informatics</conf-name><conf-loc>Valletta, Malta</conf-loc><fpage>145</fpage><lpage>155</lpage><pub-id pub-id-type="doi">10.5220/0008979901450155</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>J</given-names> </name><etal/></person-group><article-title>A survey on evaluation of large language models</article-title><source>ACM Trans Intell Syst Technol</source><year>2024</year><month>06</month><day>30</day><volume>15</volume><issue>3</issue><fpage>1</fpage><lpage>45</lpage><pub-id pub-id-type="doi">10.1145/3641289</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>L</given-names> </name><name name-style="western"><surname>Schellaert</surname><given-names>W</given-names> </name><name name-style="western"><surname>Mart&#x00ED;nez-Plumed</surname><given-names>F</given-names> </name><name name-style="western"><surname>Moros-Daval</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Ferri</surname><given-names>C</given-names> </name><name name-style="western"><surname>Hern&#x00E1;ndez-Orallo</surname><given-names>J</given-names> </name></person-group><article-title>Larger and more instructable language models become less reliable</article-title><source>Nature New Biol</source><year>2024</year><month>10</month><volume>634</volume><issue>8032</issue><fpage>61</fpage><lpage>68</lpage><pub-id pub-id-type="doi">10.1038/s41586-024-07930-y</pub-id><pub-id pub-id-type="medline">39322679</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thirunavukarasu</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Ting</surname><given-names>DSJ</given-names> </name><name name-style="western"><surname>Elangovan</surname><given-names>K</given-names> </name><name name-style="western"><surname>Gutierrez</surname><given-names>L</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>TF</given-names> </name><name name-style="western"><surname>Ting</surname><given-names>DSW</given-names> </name></person-group><article-title>Large language models in medicine</article-title><source>Nat Med</source><year>2023</year><month>08</month><volume>29</volume><issue>8</issue><fpage>1930</fpage><lpage>1940</lpage><pub-id pub-id-type="doi">10.1038/s41591-023-02448-8</pub-id><pub-id pub-id-type="medline">37460753</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>S</given-names> </name><name name-style="western"><surname>McCoy</surname><given-names>AB</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Wright</surname><given-names>A</given-names> </name></person-group><article-title>Integrating rule-based NLP and large language models for statin information extraction from clinical notes</article-title><source>Int J Med Inform</source><year>2026</year><month>01</month><volume>205</volume><fpage>106104</fpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2025.106104</pub-id><pub-id pub-id-type="medline">40925145</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lange</surname><given-names>L</given-names> </name><name name-style="western"><surname>Adel</surname><given-names>H</given-names> </name><name name-style="western"><surname>Str&#x00F6;tgen</surname><given-names>J</given-names> </name><name name-style="western"><surname>Klakow</surname><given-names>D</given-names> </name></person-group><article-title>CLIN-X: pre-trained language models and a study on cross-task transfer for concept extraction in the clinical domain</article-title><source>Bioinformatics</source><year>2022</year><month>06</month><day>13</day><volume>38</volume><issue>12</issue><fpage>3267</fpage><lpage>3274</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btac297</pub-id><pub-id pub-id-type="medline">35485748</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cascella</surname><given-names>M</given-names> </name><name name-style="western"><surname>Montomoli</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bellini</surname><given-names>V</given-names> </name><name name-style="western"><surname>Bignami</surname><given-names>E</given-names> </name></person-group><article-title>Evaluating the feasibility of ChatGPT in healthcare: an analysis of multiple clinical and research scenarios</article-title><source>J Med Syst</source><year>2023</year><month>03</month><day>4</day><volume>47</volume><issue>1</issue><fpage>33</fpage><pub-id pub-id-type="doi">10.1007/s10916-023-01925-4</pub-id><pub-id pub-id-type="medline">36869927</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Petzoldt</surname><given-names>T</given-names> </name><name name-style="western"><surname>B&#x00E4;r</surname><given-names>N</given-names> </name><name name-style="western"><surname>Ihle</surname><given-names>C</given-names> </name><name name-style="western"><surname>Krems</surname><given-names>JF</given-names> </name></person-group><article-title>Learning effects in the lane change task (LCT)&#x2014;evidence from two experimental studies</article-title><source>Transp Res F: Traffic Psychol Behav</source><year>2011</year><month>01</month><volume>14</volume><issue>1</issue><fpage>1</fpage><lpage>12</lpage><pub-id pub-id-type="doi">10.1016/j.trf.2010.09.001</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Brooks</surname><given-names>JL</given-names> </name></person-group><article-title>Counterbalancing for serial order carryover effects in experimental condition orders</article-title><source>Psychol Methods</source><year>2012</year><month>12</month><volume>17</volume><issue>4</issue><fpage>600</fpage><lpage>614</lpage><pub-id pub-id-type="doi">10.1037/a0029310</pub-id><pub-id pub-id-type="medline">22799624</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Elston</surname><given-names>DM</given-names> </name></person-group><article-title>The novelty effect</article-title><source>J Am Acad Dermatol</source><year>2021</year><month>09</month><volume>85</volume><issue>3</issue><fpage>565</fpage><lpage>566</lpage><pub-id pub-id-type="doi">10.1016/j.jaad.2021.06.846</pub-id><pub-id pub-id-type="medline">34153390</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McCarney</surname><given-names>R</given-names> </name><name name-style="western"><surname>Warner</surname><given-names>J</given-names> </name><name name-style="western"><surname>Iliffe</surname><given-names>S</given-names> </name><name name-style="western"><surname>van Haselen</surname><given-names>R</given-names> </name><name name-style="western"><surname>Griffin</surname><given-names>M</given-names> </name><name name-style="western"><surname>Fisher</surname><given-names>P</given-names> </name></person-group><article-title>The Hawthorne effect: a randomised, controlled trial</article-title><source>BMC Med Res Methodol</source><year>2007</year><month>07</month><day>3</day><volume>7</volume><issue>1</issue><fpage>30</fpage><pub-id pub-id-type="doi">10.1186/1471-2288-7-30</pub-id><pub-id pub-id-type="medline">17608932</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Supplementary Tables S1&#x2013;S4 showing additional study results.</p><media xlink:href="medinform_v13i1e80072_app1.pdf" xlink:title="PDF File, 61 KB"/></supplementary-material></app-group></back></article>