<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v13i1e76848</article-id><article-id pub-id-type="doi">10.2196/76848</article-id><article-categories><subj-group subj-group-type="heading"><subject>Implementation Report</subject></subj-group></article-categories><title-group><article-title>A Bilingual On-Premises AI Agent for Clinical Drafting: Implementation Report of Seamless Electronic Health Records Integration in the Y-KNOT Project</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Kim</surname><given-names>Hanjae</given-names></name><degrees>BS</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Lee</surname><given-names>So-Yeon</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name name-style="western"><surname>You</surname><given-names>Seng 
Chan</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Huh</surname><given-names>Sookyung</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kim</surname><given-names>Jai-Eun</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kim</surname><given-names>Sung-Tae</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ko</surname><given-names>Dong-Ryul</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kim</surname><given-names>Ji Hoon</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lee</surname><given-names>Jae Hoon</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lim</surname><given-names>Joon Seok</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff8">8</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Park</surname><given-names>Moo Suk</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff9">9</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lee</surname><given-names>Kang Young</given-names></name><degrees>MD, PhD</degrees><xref 
ref-type="aff" rid="aff10">10</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Biomedical Systems Informatics, College of Medicine, Yonsei University</institution><addr-line>50-1, Yonsei-Ro, Seodaemun-gu</addr-line><addr-line>Seoul</addr-line><country>Republic of Korea</country></aff><aff id="aff2"><institution>PHI Digital Healthcare</institution><addr-line>Seoul</addr-line><country>Republic of Korea</country></aff><aff id="aff3"><institution>Yonsei Institute for Digital Health, Yonsei University</institution><addr-line>Seoul</addr-line><country>Republic of Korea</country></aff><aff id="aff4"><institution>Department of Medical Records, Severance Hospital, Yonsei University Health System</institution><addr-line>Seoul</addr-line><country>Republic of Korea</country></aff><aff id="aff5"><institution>Saltlux Inc</institution><addr-line>Seoul</addr-line><country>Republic of Korea</country></aff><aff id="aff6"><institution>Department of Emergency Medicine, College of Medicine, Yonsei University</institution><addr-line>Seoul</addr-line><country>Republic of Korea</country></aff><aff id="aff7"><institution>Department of Anesthesiology and Pain Medicine, Anesthesia and Pain Research Institute, College of Medicine, Yonsei University</institution><addr-line>Seoul</addr-line><country>Republic of Korea</country></aff><aff id="aff8"><institution>Department of Radiology, College of Medicine, Yonsei University</institution><addr-line>Seoul</addr-line><country>Republic of Korea</country></aff><aff id="aff9"><institution>Division of Pulmonary and Critical Care Medicine, Department of Internal Medicine, College of Medicine, Yonsei University</institution><addr-line>Seoul</addr-line><country>Republic of Korea</country></aff><aff id="aff10"><institution>Department of Surgery, College of Medicine, Yonsei University</institution><addr-line>Seoul</addr-line><country>Republic of Korea</country></aff><contrib-group><contrib contrib-type="editor"><name 
name-style="western"><surname>Perrin</surname><given-names>Caroline</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Hong</surname><given-names>Pengyu</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Zhao</surname><given-names>Yang</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Seng Chan You, MD, PhD, Department of Biomedical Systems Informatics, College of Medicine, Yonsei University, 50-1, Yonsei-Ro, Seodaemun-gu, Seoul, 03722, Republic of Korea, 82 22282500; <email>chandryou@yuhs.ac</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>24</day><month>11</month><year>2025</year></pub-date><volume>13</volume><elocation-id>e76848</elocation-id><history><date date-type="received"><day>02</day><month>05</month><year>2025</year></date><date date-type="rev-recd"><day>26</day><month>08</month><year>2025</year></date><date date-type="accepted"><day>10</day><month>09</month><year>2025</year></date></history><copyright-statement>&#x00A9; Hanjae Kim, So-Yeon Lee, Seng Chan You, Sookyung Huh, Jai-Eun Kim, Sung-Tae Kim, Dong-Ryul Ko, Ji Hoon Kim, Jae Hoon Lee, Joon Seok Lim, Moo Suk Park, Kang Young Lee. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 24.11.2025. 
</copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2025/1/e76848"/><abstract><sec><title>Background</title><p>Large language models (LLMs) have shown promise in reducing clinical documentation burden, yet their real-world implementation remains rare. Especially in South Korea, hospitals face several unique challenges, such as strict data sovereignty requirements and the need to operate in environments where English is not the primary language for documentation. Therefore, we initiated the Your-Knowledgeable Navigator of Treatment (Y-KNOT) project, aimed at developing an on-premises bilingual LLM-based artificial intelligence (AI) agent system integrated with electronic health records (EHRs) for automated clinical drafting.</p></sec><sec><title>Objective</title><p>We present the Y-KNOT project and provide insights into implementing AI-assisted clinical drafting tools within the constraints of the health care system.</p></sec><sec sec-type="methods"><title>Methods</title><p>This project involved multiple stakeholders and encompassed three simultaneous processes: LLM development, clinical co-development, and EHR integration. 
We developed a foundation LLM by pretraining Llama3-8B with Korean and English medical corpora. During the clinical co-development phase, the LLM was instruction-tuned for specific documentation tasks through iterative cycles that aligned physicians&#x2019; clinical requirements, hospital data availability, documentation standards, and technical feasibility. The EHR integration phase focused on seamless AI agent incorporation into clinical workflows, involving document standardization, trigger points definition, and user interaction optimization.</p></sec><sec><title>Implementation (Results)</title><p>The resulting system processes emergency department discharge summaries and preanesthetic assessments while maintaining existing clinical workflows. The drafting process is automatically triggered by specific events, such as scheduled batch jobs, with medical records automatically fed into the LLM as input. The agent is built on premises, locating all the architecture inside the hospital.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>The Y-KNOT project demonstrates the first seamless integration of an AI agent into an EHR system for clinical drafting. In collaboration with various clinical and administrative teams, we could promptly implement an LLM while addressing key challenges of data security, bilingual requirements, and workflow integration. 
Our experience highlights a practical and scalable approach to utilizing LLM-based AI agents for other health care institutions, paving the way for broader adoption of LLM-based solutions.</p></sec></abstract><kwd-group><kwd>artificial intelligence agent</kwd><kwd>large language models</kwd><kwd>documentation</kwd><kwd>electronic health records</kwd><kwd>insights</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background</title><p>Large language models (LLMs) have recently garnered significant attention, raising expectations for their applications in health care systems, encompassing clinical care support, research, and education [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. However, most research has focused on implementations in the United States, and these solutions have yet to demonstrate meaningful reductions in administrative burden, as they mainly address tasks related to medical knowledge [<xref ref-type="bibr" rid="ref3">3</xref>].</p><p>South Korea&#x2019;s health care system is renowned for its efficiency, offering low costs with high accessibility and quality. However, this efficiency comes with inherent challenges in resource allocation. Health care providers often manage substantial workloads, seeing many patients in limited time frames. This situation has been particularly exacerbated by recent mass resignation of residents, which has left tertiary hospitals facing a critical shortage of human resources [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. 
These circumstances underscore an urgent demand for meaningful assistance from LLMs.</p><p>Clinical documentation represents a significant burden for health care providers [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>], and there is growing optimism about LLMs&#x2019; potential to alleviate this burden [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. Clinical documentation involves condensing previous records, a task that LLMs excel at [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. Accordingly, several studies have explored the capabilities of proprietary LLMs in generating clinical notes such as radiology referrals [<xref ref-type="bibr" rid="ref12">12</xref>] or discharge summaries [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. However, implementing existing LLM solutions in South Korea faces several unique challenges. Korean medical regulations mandate that all medical records be stored exclusively on domestic servers or clouds [<xref ref-type="bibr" rid="ref15">15</xref>], making it impossible to utilize foreign commercial services like ChatGPT [<xref ref-type="bibr" rid="ref16">16</xref>]. Additionally, medical documents in Korea often exhibit mixed usage of Korean and English, requiring models capable of processing bilingual clinical notes effectively [<xref ref-type="bibr" rid="ref17">17</xref>]. Korea&#x2019;s Ministry of Food and Drug Safety does not classify artificial intelligence (AI) software for documentation as a medical device unless it involves medical judgements [<xref ref-type="bibr" rid="ref18">18</xref>], thereby exempting the requirement for regulatory approval. 
Nevertheless, these challenges hinder the widespread adoption of LLMs in Korea.</p><p>Although some pilot projects have attempted incorporating LLMs within electronic health records (EHRs), full-scale integration in real clinical settings remains rare. Due to their separate interface, manually retrieving information from EHRs and typing it into LLMs may ironically be time-consuming. In the study by Goh et al [<xref ref-type="bibr" rid="ref19">19</xref>], interaction with an LLM led to increased time in patient management reasoning. For LLMs to be continuously and effectively utilized by health care providers, connecting LLMs directly to EHRs is necessary.</p><p>To address these challenges, we initiated the Your-Knowledgeable Navigator of Treatment (Y-KNOT) project, aimed at developing a hospital-dedicated AI agent that seamlessly integrates a small, bilingual LLM with existing systems for automatic clinical drafting. This paper presents our experiences and insights from developing and implementing this solution.</p></sec><sec id="s1-2"><title>Objectives</title><p>We aim to demonstrate a practical approach to leveraging LLMs within the constraints of the health care system, potentially offering a model for similar implementations in other limited-resource settings. This paper highlights the multidisciplinary process of the Y-KNOT project, key features of the final implementation, and presents a human evaluation of its feasibility. Our experience provides valuable insights into the challenges and opportunities of integrating AI-assisted clinical drafting tools in health care settings while maintaining compliance with local regulations and addressing specific linguistic requirements.</p></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Ethical Considerations</title><p>This study was reviewed and approved by the Institutional Review Board (IRB No. 4-2023-003) and the Data Review Board (DRB No. 24-01-005) of Severance Hospital. 
All patient data used in this study were retrieved from the hospital&#x2019;s research-purpose EHR database and deidentified prior to use, waiving the need for additional informed consent.</p></sec><sec id="s2-2"><title>Project Overview</title><p>The Y-KNOT project was conducted at Severance Hospital, a tertiary hospital in Seoul, South Korea. The project was initiated in June 2024 and the first service in routine clinical practice started in November 2024. The total cost of the project, including all expenses such as equipment and labor, did not exceed US $1,500,000. The final LLM model developed in this project is jointly owned by Severance Hospital and &#x2018;PHI Digital Healthcare Co., Ltd.&#x2019; (Seoul, South Korea).</p><p>This implementation report adheres to the iCHECK-DH (Guidelines and Checklist for the Reporting on Digital Health Implementations) reporting guidelines [<xref ref-type="bibr" rid="ref20">20</xref>] (<xref ref-type="supplementary-material" rid="app5">Checklist 1</xref>).</p><p>The project encompassed three major phases: medical foundation LLM development, clinical co-development, and EHR integration, which were carried out simultaneously. <xref ref-type="fig" rid="figure1">Figure 1</xref> displays the overall project landscape.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Overall landscape of the Y-KNOT project. B: billions; ED: emergency department; EHR: electronic health record; GB: gigabytes; LLM: large language model; Y-KNOT: Your-Knowledgeable Navigator of Treatment.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e76848_fig01.png"/></fig></sec><sec id="s2-3"><title>Development of Medical Foundation LLM</title><p>We first developed &#x2018;Y-KNOT-med-base,&#x2019; a small, bilingual LLM for general medical purposes. 
We used Luxia 2 [<xref ref-type="bibr" rid="ref21">21</xref>] developed by &#x2018;Saltlux Inc.&#x2019; (Seoul, South Korea) as a base model, which was built upon Llama 3 (8 billion parameters) [<xref ref-type="bibr" rid="ref22">22</xref>] and specialized for Korean language through pretraining on 1.5 terabytes of general corpus datasets. We decided to use a small model for rapid project completion, minimal latency in clinical settings, and environmental and economic sustainability. To adapt the model for medical applications, we further trained it with 90 GB of medical and 9 GB of general corpus datasets in Korean and English, consisting of open source and internally collected datasets. The pretraining data was augmented with instruction-response pairs for instruction pretraining [<xref ref-type="bibr" rid="ref23">23</xref>], which enables better alignment with domain-specific tasks. The training was conducted outside of the hospital to ensure greater flexibility and broader reusability of the foundation model by other institutions. Hyperparameter settings are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><p>To assess its capability to understand medical knowledge, we evaluated &#x2018;Y-KNOT-med-base&#x2019; on PubMedQA (biomedical question answering based on PubMed abstracts) [<xref ref-type="bibr" rid="ref24">24</xref>] for English and KorMedMCQA (multichoice question answering derived from licensing examinations for doctors, nurses, and pharmacists in South Korea) [<xref ref-type="bibr" rid="ref25">25</xref>] for Korean. We used 5-shot learning for both benchmarks and compared the results with other baseline models. Baseline models for PubMedQA were selected from the state-of-the-art models on the PubMedQA leaderboard [<xref ref-type="bibr" rid="ref26">26</xref>] whose parameter sizes were disclosed. 
Baseline models and their respective results for KorMedMCQA were taken from the original KorMedMCQA paper [<xref ref-type="bibr" rid="ref25">25</xref>], focusing specifically on nonproprietary multilingual models.</p></sec><sec id="s2-4"><title>Clinical Co-Development Phase</title><p>The Y-KNOT project involved intensive collaboration with related departments, including physicians, data scientists, software engineers, and medical record specialists. Working closely together, we established six core values: innovation, collaboration, integration, sovereignty, scrutiny, and efficiency (<xref ref-type="fig" rid="figure2">Figure 2</xref>).</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Core values of the Y-KNOT project. AI: artificial intelligence; EHR: electronic health record; IT: information technology; LLM: large language model; Y-KNOT: Your-Knowledgeable Navigator of Treatment.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e76848_fig02.png"/></fig><p>With the core values internalized, we conducted multiple iterative development cycles. Each cycle began with defining specific clinical documentation needs, followed by identifying available EHR data, assessing the technical feasibility of LLM implementation, and refining results through data adjustments and retraining of the model. Through these cycles, we progressively refined our understanding of automatable document types, confirmed the output templates, and determined the optimal approach for automation&#x2013;whether through rule-based systems or LLM inference. 
This process was essential for establishing a system that not only met immediate clinical needs but also ensured standardization across departments while maintaining compliance with medical documentation requirements.</p><p>To adapt the LLM for drafting specific document types&#x2013;emergency department (ED) discharge summary and preanesthetic assessment&#x2013;we instruction-tuned the Y-KNOT-med-base. We called the resulting model &#x2018;Y-KNOT-MD,&#x2019; which is an abbreviation for &#x2018;Y-KNOT medical document.&#x2019; Medical document data for the model prompts were selected from the hospital&#x2019;s EHR database. Corresponding completions were prepared by physicians, addressing clinical needs while following the guidelines established by data scientists. The model was trained on 300 prompt-completion pairs for each document type. As the training involved patient data, it was conducted within the hospital environment to minimize the risk of data leakage. Details regarding hyperparameter settings are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-5"><title>EHR Integration Phase</title><p>In parallel with the previously described phases, we conducted comprehensive EHR integration planning with the hospital&#x2019;s EHR team. This phase focused on defining the optimal service architecture to seamlessly integrate the AI agent into existing clinical workflows. It encompassed three key components: medical document standardization, service trigger point definition, and user interaction optimization.</p><p>First, we screened medical document forms from the EHR system to be used for the actual service. Out of 2201 different document forms, a total of 989 forms were selected. The rest were excluded due to inconsistent usage, absence of textual content, or their association with surveys, referrals, palliative care, or physical therapies. 
This decision was reached after numerous meetings with the medical records team and clinicians. Then, we standardized the selected forms based on Fast Healthcare Interoperability Resources (FHIR) [<xref ref-type="bibr" rid="ref27">27</xref>] standards. This standardization not only enhanced interoperability for existing documentation but also established a robust framework for future development, ensuring long-term system scalability and maintainability.</p><p>Second, we mapped precise trigger points for AI agent activation to ensure assistance without disrupting existing clinical routines. The system supports both real-time triggers and batch processing. We carefully selected the optimal time for batch processing to minimize potential system load, and tested system latency to ensure that the integration would not impact the EHR&#x2019;s overall performance.</p><p>Third, we established a documentation display and a user interaction framework that maximized efficiency while preserving physician control over final documentation. The interface enabled quick review and editing of AI-generated content through intuitive controls for accepting, modifying, or rejecting suggestions. This design emphasized minimal click paths to streamline the documentation process.</p><p>To ensure data sovereignty, all infrastructure, including servers and databases, was hosted within the hospital&#x2019;s secure on-premises environment.</p></sec><sec id="s2-6"><title>Predefined Clinical Evaluation Criteria</title><p>Before deployment in the actual clinical setting, we evaluated the quality of automatically generated ED discharge summaries and preanesthetic assessments to assess the performance of the AI agent. For each type of document, 100 pairs of input data, which had not been used during development, and the corresponding model outputs were provided to 2 physicians. 
The physicians graded the outputs in terms of consistency, coherence, fluency, relevance, safety, subjective satisfactory rate, and usability. In addition, the impact on decision-making was graded only for preanesthetic assessments. The specific criteria for each metric are listed in <xref ref-type="table" rid="table1">Table 1</xref>. All metrics were graded using 5-point Likert Scales, except for usability, which had a maximum score of 4, and impact on decision-making, which had a maximum score of 3. Higher scores indicated better output quality for all metrics. Mean scores were calculated for all metrics, except for impact on decision-making, where the proportion for each score was calculated.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Criteria for evaluating auto-generated drafts.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Metrics</td><td align="left" valign="bottom">Range<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td><td align="left" valign="bottom">Criteria</td></tr></thead><tbody><tr><td align="left" valign="top">Consistency</td><td align="left" valign="top">1&#x2010;5</td><td align="left" valign="top">The consistency of the information provided on the output</td></tr><tr><td align="left" valign="top">Coherence</td><td align="left" valign="top">1&#x2010;5</td><td align="left" valign="top">The logical structure of the output in context</td></tr><tr><td align="left" valign="top">Fluency</td><td align="left" valign="top">1&#x2010;5</td><td align="left" valign="top">The appropriateness in grammatical, lexical, or structural aspects of the output</td></tr><tr><td align="left" valign="top">Relevance</td><td align="left" valign="top">1&#x2010;5</td><td align="left" valign="top">The alignment of the output with the topic</td></tr><tr><td align="left" valign="top">Safety</td><td align="left" valign="top">1&#x2010;5</td><td align="left" valign="top">The 
correctness of medical information in the output</td></tr><tr><td align="left" valign="top">Subjective satisfactory rate</td><td align="left" valign="top">1&#x2010;5</td><td align="left" valign="top">Subjective measurement of overall satisfaction with the output</td></tr><tr><td align="left" valign="top">Usability</td><td align="left" valign="top">1&#x2010;4</td><td align="left" valign="top">Whether the output can be provided to the user without modifications</td></tr><tr><td align="left" valign="top">Impact on decision-making<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top">1&#x2010;3</td><td align="left" valign="top">The extent to which the response influences medical judgment, categorized into three levels: positive, no impact, and negative</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>A higher score indicates better quality of output in all metrics.</p></fn><fn id="table1fn2"><p><sup>b</sup>This metric was used solely for evaluating preanesthetic assessments.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s3"><title>Implementation (Results)</title><sec id="s3-1"><title>Performance Evaluation of Medical Knowledge and Language Capabilities</title><p>The &#x2018;Y-KNOT-med-base&#x2019; achieved an accuracy score of 75.2 on the PubMedQA. Despite its relatively small size and the absence of a fine-tuning process, the performance was comparable to that of state-of-the-art baselines that were fine-tuned at larger parameter scales. The average accuracy score was 55.8 on the KorMedMCQA (doctor: 47.0, nurse: 64.1, pharmacist: 56.2), outperforming other multilingual pretrained models on all three exam categories. 
Detailed performance results are provided in <xref ref-type="table" rid="table2">Tables 2</xref> and <xref ref-type="table" rid="table3">3</xref>.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Evaluation result of Y-KNOT-med-base<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> on PubMedQA<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup>.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">Accuracy</td></tr></thead><tbody><tr><td align="left" valign="top">Meditron-70B</td><td align="char" char="." valign="top">81.6</td></tr><tr><td align="left" valign="top">Palmyra-Med-40B</td><td align="char" char="." valign="top">81.1</td></tr><tr><td align="left" valign="top">AntGLM-Med-10B</td><td align="char" char="." valign="top">80.6</td></tr><tr><td align="left" valign="top">Flan-PaLM-540B</td><td align="char" char="." valign="top">79</td></tr><tr><td align="left" valign="top">Y-KNOT-med-base-8B</td><td align="char" char="." 
valign="top">75.2</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>Y-KNOT: Your-Knowledgeable Navigator of Treatment.</p></fn><fn id="table2fn2"><p><sup>b</sup>PubMedQA: PubMedQA dataset is freely available on Hugging Face [<xref ref-type="bibr" rid="ref28">28</xref>].</p></fn></table-wrap-foot></table-wrap><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Evaluation result of Y-KNOT-med-base<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> on KorMedMCQA<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup>.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom" colspan="4">Accuracy</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Doctor</td><td align="left" valign="bottom">Nurse</td><td align="left" valign="bottom">Pharm</td><td align="left" valign="bottom">Average</td></tr></thead><tbody><tr><td align="left" valign="top">Llama2-70B</td><td align="char" char="." valign="top">42.5</td><td align="char" char="." valign="top">63.5</td><td align="char" char="." valign="top">53.3</td><td align="char" char="." valign="top">53.1</td></tr><tr><td align="left" valign="top">Yi-34B</td><td align="char" char="." valign="top">40</td><td align="char" char="." valign="top">55.5</td><td align="char" char="." valign="top">52.8</td><td align="char" char="." valign="top">49.4</td></tr><tr><td align="left" valign="top">SOLAR-10.7B-v1.0</td><td align="char" char="." valign="top">37.2</td><td align="char" char="." valign="top">55.5</td><td align="char" char="." valign="top">54.1</td><td align="char" char="." valign="top">48.9</td></tr><tr><td align="left" valign="top">Mistral-7B-v0.1</td><td align="char" char="." valign="top">29.8</td><td align="char" char="." valign="top">42.1</td><td align="char" char="." valign="top">43.5</td><td align="char" char="." 
valign="top">38.5</td></tr><tr><td align="left" valign="top">Y-KNOT-med-base-8B</td><td align="char" char="." valign="top">47</td><td align="char" char="." valign="top">64.1</td><td align="char" char="." valign="top">56.2</td><td align="char" char="." valign="top">55.8</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>Y-KNOT: Your-Knowledgeable Navigator of Treatment.</p></fn><fn id="table3fn2"><p><sup>b</sup>KorMedMCQA dataset is freely available on Hugging Face [<xref ref-type="bibr" rid="ref29">29</xref>].</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Automatic Drafting of Clinical Documents</title><p>For ED discharge summaries, the AI agent drafts the entire content in one paragraph, which includes past medical histories, the reason for the visit, and the details of specialty consultations or treatments. In response to the urgent and fast-paced nature of the ED, the outputs are designed to be as concise as possible, meeting the specific requirements of the physicians.</p><p>For preanesthetic assessments, the agent drafts a patient&#x2019;s background information required for preparing anesthesia, including basic information, past medical histories, medications, examination results, and other specialty consultation histories. Contents requiring medical judgment, such as the anesthesiologist&#x2019;s opinion, premedication guides, or American Society of Anesthesiologists (ASA) classification, were excluded because an LLM that makes medical judgments could be risky.</p><p>Detailed examples of generated drafts are provided in <xref ref-type="fig" rid="figure3">Figure 3</xref>.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Examples of input data types and subsequent output contents of auto-generated drafts. All medical records used as input data are converted into Fast Healthcare Interoperability Resources (FHIR) standards. Criteria for selecting input data are stated in parentheses. 
Note that the examples provided in the figure are simplified versions of the actual data, which originally contain a mixture of Korean and English. The untranslated figure can be found in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>. (A) An example of input data types and output contents of drafted emergency department discharge summaries; (B) An example of input data types and output contents of drafted preanesthetic assessments. ED: emergency department; LLM: large language model; OCS: order communication system; Y-KNOT: Your-Knowledgeable Navigator of Treatment.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e76848_fig03.png"/></fig></sec><sec id="s3-3"><title>Integration and Implementation in Clinical Practice</title><p>The Y-KNOT service is currently deployed at Severance Hospital for real-world use. Since the agent is fully integrated into the EHR system, the drafting process is automatically triggered through two workflows familiar to physicians. For ED discharge summaries, physicians can initiate drafting by placing a &#x201C;draft creation&#x201D; order, similar to medication orders, due to the need for prompt creation in acute care settings (<xref ref-type="fig" rid="figure4">Figure 4A</xref>). For preanesthetic assessments, which are associated with scheduled surgeries, the system generates drafts in batches according to a predetermined schedule. As a physician opens a form for documentation, auto-generated drafts show up in the pop-up window (<xref ref-type="fig" rid="figure4">Figure 4B</xref>). No external programs other than the EHR system are required to use the LLM. The entire process is similar to usual documentation workflows, except physicians can now load drafts with a single click instead of writing them from scratch. 
This also prevents potential risks of adversarial attacks [<xref ref-type="bibr" rid="ref30">30</xref>] by keeping users away from instructing the LLM. Videos demonstrating the actual clinical use of the service are available in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendices 3</xref> and <xref ref-type="supplementary-material" rid="app4">4</xref>.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>User interaction with the EHR system for automatic clinical drafting. (A) Requesting a draft creation through the order communication system; (B) Reviewing the auto-generated draft in the pop-up window. ED: emergency department.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e76848_fig04.png"/></fig><p>When the drafting is initiated, relevant patient records in FHIR format are transmitted from the EHR server to the Y-KNOT system, which processes them using a combination of LLM and rule-based approaches. The system preprocesses these standardized records into multiple prompts, each designed to extract specific aspects of the document. The LLM processes these prompts independently and generates outputs which are eventually synthesized into a comprehensive document draft. This final draft is returned to the EHR for physician review and approval. This automatic process (<xref ref-type="fig" rid="figure5">Figure 5</xref>) operates through predefined application programming interfaces (APIs) that specify data exchange formats between system components.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Overview of the automated drafting process with the AI agent in the EHR system. 
AI: artificial intelligence; EHR: electronic health record; FHIR: Fast Healthcare Interoperability Resources; LLM: large language model; Y-KNOT: Your-Knowledgeable Navigator of Treatment.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e76848_fig05.png"/></fig></sec><sec id="s3-4"><title>Clinical Performance and Impact Assessment</title><p>The mean scores graded on drafted ED discharge summaries were 4.78 for consistency, 4.60 for coherence, 4.55 for fluency, 4.72 for relevance, 4.73 for safety, 3.95 for subjective satisfactory rate, and 3.32 for usability. The mean scores on drafted preanesthetic assessments were 3.29 for consistency, 3.86 for coherence, 4.23 for fluency, 3.37 for relevance, 3.88 for safety, 3.14 for subjective satisfactory rate, and 2.58 for usability. Additionally, out of 200 individual ratings on the impact on decision-making of preanesthetic assessments (2 raters evaluating 100 drafts), 69 (34.5%) were judged to be positive and 98 (49.0%) as having no impact, while 33 (16.5%) were judged to be negative (<xref ref-type="table" rid="table4">Table 4</xref>).</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Clinical evaluation results on drafts generated by the Y-KNOT<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup> AI agent.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Metrics</td><td align="left" valign="bottom">ED<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup> discharge summaries (n=200)</td><td align="left" valign="bottom">Preanesthetic assessments (n=200)</td></tr></thead><tbody><tr><td align="left" valign="top">Consistency, mean (SD)</td><td align="char" char="." valign="top">4.78 (0.56)</td><td align="char" char="." valign="top">3.29 (1.10)</td></tr><tr><td align="left" valign="top">Coherence, mean (SD)</td><td align="char" char="." 
valign="top">4.60 (0.75)</td><td align="char" char="." valign="top">3.86 (0.82)</td></tr><tr><td align="left" valign="top">Fluency, mean (SD)</td><td align="char" char="." valign="top">4.55 (0.73)</td><td align="char" char="." valign="top">4.23 (0.69)</td></tr><tr><td align="left" valign="top">Relevance, mean (SD)</td><td align="char" char="." valign="top">4.72 (0.61)</td><td align="char" char="." valign="top">3.37 (0.91)</td></tr><tr><td align="left" valign="top">Safety, mean (SD)</td><td align="char" char="." valign="top">4.73 (0.63)</td><td align="char" char="." valign="top">3.88 (0.94)</td></tr><tr><td align="left" valign="top">Subjective satisfactory rate, mean (SD)</td><td align="char" char="." valign="top">3.95 (1.03)</td><td align="char" char="." valign="top">3.14 (1.10)</td></tr><tr><td align="left" valign="top">Usability<sup>b</sup>, mean (SD)</td><td align="char" char="." valign="top">3.32 (0.76)</td><td align="char" char="." valign="top">2.58 (0.87)</td></tr><tr><td align="left" valign="top" colspan="3">Impact on decision-making, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;Positive impacts</td><td align="left" valign="top">&#x2014;</td><td align="char" char="." valign="top">69 (34.5)</td></tr><tr><td align="left" valign="top">&#x2003;No impacts</td><td align="left" valign="top">&#x2014;</td><td align="char" char="." valign="top">98 (49.0)</td></tr><tr><td align="left" valign="top">&#x2003;Negative impacts</td><td align="left" valign="top">&#x2014;</td><td align="char" char="." 
valign="top">33 (16.5)</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>Y-KNOT: Your-Knowledgeable Navigator of Treatment.</p></fn><fn id="table4fn2"><p><sup>b</sup>ED: emergency department.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Implications</title><p>The Y-KNOT project demonstrates a successful implementation of a bilingual on-premises LLM-based clinical drafting system that seamlessly integrates with existing EHR workflows in a high-throughput health care setting. Through close collaboration with stakeholders, we addressed several critical challenges.</p><p>Our decision to use a small model was crucial for real-world deployment, as larger models require substantial computational resources and costs. Although smaller models may have limitations in processing lengthy contexts and complex medical information, proper instruction-tuning enables them to perform specific tasks on par with larger models [<xref ref-type="bibr" rid="ref31">31</xref>]. While initial clinical evaluation results of our model were modest, we prioritized rapid development using a small model to address the hospital&#x2019;s pressing clinical needs. We transparently disclosed the evaluation results to all stakeholders and educated physicians prior to deployment regarding the possibility of errors in model outputs, with specific examples provided. After deployment, discharge summary documentation completion rates in the emergency department improved from 92.7% in April-May 2024 to 98.0% in April-May 2025. Our experience demonstrates that carefully optimized smaller models can effectively support specific clinical drafting tasks when combined with thoughtful implementation strategies.</p><p>Moreover, our small model could address the unique challenges of resource-limited health care settings. 
South Korea&#x2019;s health care system, while renowned for its accessibility, operates at markedly low cost, with the average cost per outpatient visit at tertiary hospitals being less than US $15, whereas in the United States, it exceeds US $100 [<xref ref-type="bibr" rid="ref32">32</xref>]. This cost structure makes it financially unfeasible to deploy large-scale LLMs as the operational costs would significantly exceed the revenue per visit. Currently, the operational costs of the Y-KNOT service are solely covered by the hospital, but a national funding strategy could offer a more efficient approach for broader implementation in the future.</p><p>South Korea&#x2019;s health care system is also highly efficient, with outpatient consultation times averaging merely 4.2 minutes [<xref ref-type="bibr" rid="ref33">33</xref>], which is significantly shorter than the 20 minutes in the United States [<xref ref-type="bibr" rid="ref34">34</xref>]. This extreme time constraint presented both an opportunity and a challenge: while it highlighted an urgent need for documentation assistance, it also demanded exceptional efficiency in implementation. We addressed this challenge through strategic EHR integration, enabling documentation drafting to occur concurrently with other clinical tasks, which eliminated perceived latency and maintained the rapid pace of clinical practice. This approach demonstrates how AI can be successfully integrated even in highly time-constrained, cost-sensitive clinical environments without disrupting established workflows.</p><p>To ensure scalable deployment across different health care institutions, we standardized all document templates to FHIR format and implemented API-based data exchange. 
As of December 2022, the Ministry of Health and Welfare in South Korea has established a taskforce to implement a 5-year strategy to accelerate health data standardization, which includes the specific task of developing and deploying Korea-specific FHIR standards [<xref ref-type="bibr" rid="ref35">35</xref>]. In line with this initiative, we created a system that can be readily deployed to any EHR system that adheres to FHIR standards. This architectural decision not only ensures interoperability but also significantly reduces the technical barriers for other health care institutions wanting to implement similar AI-assisted documentation systems.</p></sec><sec id="s4-2"><title>Limitations</title><p>Our study has several limitations. First, clinical evaluation involved only 2 personnel per document type, potentially introducing bias due to small sample size. Second, we have not validated its performance across multiple institutions. Multicenter implementation studies would be crucial to establish the generalizability of our approach and identify potential institution-specific adaptation requirements. Third, this study does not include prospective results measuring the system&#x2019;s impact on physician workload and documentation efficiency. Previous studies have raised concerns that the need for validating AI-generated outputs might paradoxically increase physician workload [<xref ref-type="bibr" rid="ref36">36</xref>], making it crucial to evaluate the actual time savings through rigorous clinical studies [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. We are actively conducting such prospective studies and plan to report our findings in future publications. Impacts on clinical decision-making or patient outcomes should also be assessed through long-term studies. Fourth, the financial implications remain to be fully understood. 
While there are expectations of cost benefits from AI implementation in health care [<xref ref-type="bibr" rid="ref39">39</xref>], recent studies of similar technologies like ambient-listening AI have shown no significant financial advantages [<xref ref-type="bibr" rid="ref40">40</xref>]. Future research should address these limitations through in-depth analyses with multicenter implementation studies, prospective evaluations of efficiency gains, clinical impact, and cost-effectiveness.</p></sec><sec id="s4-3"><title>Conclusions</title><p>This study provides a comprehensive account of developing and integrating an LLM-based AI agent for clinical drafting in routine clinical practice. We developed a specialized LLM by taking into consideration issues such as data sovereignty, bilingual challenges, and cost-effectiveness. In collaboration with various stakeholders, we integrated this solution with the EHR system to ensure practical usability by physicians without interruption of existing workflow.</p></sec></sec></body><back><ack><p>The authors thank the following contributors at Yonsei University Health System for their technical assistance and advice to the Y-KNOT project. They did not receive any separate compensation beyond their regular institutional responsibilities for these contributions: Jihyun Yang and Jeeeun Jung at the Department of Medical Records, Division of Digital Health; Eunhye Kang, Hyekyung Jung, Younghee Lim, and JaeHyeon Park at the Department of Information Services, Division of Digital Health; Young ah Kim, Heui seok Kang, and Hyunsook Seong at the Department of Data Services, Division of Digital Health; Eun Jung Kang, Kyung Han Kim, and Jong Myoung Kim at the Digital Health Strategy Team, Division of Digital Health, Yonsei University Health System, Seoul, Republic of Korea. 
Furthermore, the authors thank the members of the Data Science Department, PHI Digital Healthcare, Seoul, Republic of Korea, for their contributions to this project.</p></ack><notes><sec><title>Data Availability</title><p>Source data, including medical records from electronic health records, is not publicly available due to the policy of the health care institution and privacy protection regulations. Datasets used as benchmarks are publicly accessible via the provided references. Raw scores graded for clinical performance can be provided upon reasonable request to the authors. The code used in this study is not publicly available due to company policies and data confidentiality restrictions.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: SYL, SCY</p><p>Data curation: HK, JEK, STK, DRK</p><p>Formal analysis: HK, JEK, STK, DRK</p><p>Funding acquisition: SCY, JSL, KYL</p><p>Investigation: HK, SYL, SCY</p><p>Methodology: HK, SYL, SCY, JHK, JHL</p><p>Project administration: SYL, SCY, SH</p><p>Resources: SCY, SH, JSL, KYL</p><p>Software: JEK, STK, DRK</p><p>Supervision: SCY</p><p>Validation: HK, SYL, JHK, JHL, JSL, MSP, KYL</p><p>Visualization: HK</p><p>Writing &#x2013; original draft: HK, SYL, SCY</p><p>Writing &#x2013; review &#x0026; editing: HK, SYL, SCY, SH, JEK, STK, DRK, JHK, JHL, JSL, MSP, KYL</p></fn><fn fn-type="conflict"><p>This research was supported by PHI Digital Healthcare and is associated with Patent Applications PATENT-2025&#x2010;0039190, PATENT-2025&#x2010;0039191, PATENT-2025&#x2010;0039192, PATENT-2025&#x2010;0039193, and PATENT-2025&#x2010;0039194. SCY reports grants from Daiichi Sankyo. He is a coinventor of granted Korea Patents DP-2023&#x2010;1223 and DP-2023&#x2010;0920, and pending Patent Applications DP-2024&#x2010;0909, DP-2024&#x2010;0908, DP-2022&#x2010;1658, DP-2022&#x2010;1478, and DP-2022&#x2010;1365 unrelated to the current work. SCY is the chief executive officer of PHI Digital Healthcare. 
HK was an employee of PHI Digital Healthcare during this study. SYL is an employee of PHI Digital Healthcare. JEK, STK, and DRK are employees of Saltlux Inc. KYL serves as a general director of Severance Hospital, Yonsei University Health System. Other authors have no potential conflicts of interest to disclose.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">API</term><def><p>application programming interface</p></def></def-item><def-item><term id="abb3">EHR</term><def><p>electronic health record</p></def></def-item><def-item><term id="abb4">FHIR</term><def><p>Fast Healthcare Interoperability Resources</p></def></def-item><def-item><term id="abb5">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb6">Y-KNOT</term><def><p>Your-Knowledgeable Navigator of Treatment</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thirunavukarasu</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Ting</surname><given-names>DSJ</given-names> </name><name name-style="western"><surname>Elangovan</surname><given-names>K</given-names> </name><name name-style="western"><surname>Gutierrez</surname><given-names>L</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>TF</given-names> </name><name name-style="western"><surname>Ting</surname><given-names>DSW</given-names> </name></person-group><article-title>Large language models in medicine</article-title><source>Nat Med</source><year>2023</year><month>08</month><volume>29</volume><issue>8</issue><fpage>1930</fpage><lpage>1940</lpage><pub-id pub-id-type="doi">10.1038/s41591-023-02448-8</pub-id><pub-id 
pub-id-type="medline">37460753</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Clusmann</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kolbinger</surname><given-names>FR</given-names> </name><name name-style="western"><surname>Muti</surname><given-names>HS</given-names> </name><etal/></person-group><article-title>The future landscape of large language models in medicine</article-title><source>Commun Med (Lond)</source><year>2023</year><month>10</month><day>10</day><volume>3</volume><issue>1</issue><fpage>141</fpage><pub-id pub-id-type="doi">10.1038/s43856-023-00370-1</pub-id><pub-id pub-id-type="medline">37816837</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bedi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Orr-Ewing</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Testing and evaluation of health care applications of large language models: a systematic review</article-title><source>JAMA</source><year>2025</year><month>01</month><day>28</day><volume>333</volume><issue>4</issue><fpage>319</fpage><lpage>328</lpage><pub-id pub-id-type="doi">10.1001/jama.2024.21700</pub-id><pub-id pub-id-type="medline">39405325</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yoon</surname><given-names>J</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>JY</given-names> </name></person-group><article-title>Challenges arising from disruptions in Psychiatry Training: implications of 
residents&#x2019; mass resignation in South Korea</article-title><source>Acad Psychiatry</source><year>2025</year><month>06</month><volume>49</volume><issue>3</issue><fpage>297</fpage><lpage>298</lpage><pub-id pub-id-type="doi">10.1007/s40596-024-02108-0</pub-id><pub-id pub-id-type="medline">39702879</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Park</surname><given-names>J</given-names> </name><name name-style="western"><surname>Shin</surname><given-names>CH</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>JY</given-names> </name></person-group><article-title>Why Did All the Residents Resign? Key Takeaways From the Junior Physicians&#x2019; Mass Walkout in South Korea</article-title><source>J Grad Med Educ</source><year>2024</year><month>08</month><volume>16</volume><issue>4</issue><fpage>402</fpage><lpage>406</lpage><pub-id pub-id-type="doi">10.4300/JGME-D-24-00227.1</pub-id><pub-id pub-id-type="medline">39148889</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tajirian</surname><given-names>T</given-names> </name><name name-style="western"><surname>Stergiopoulos</surname><given-names>V</given-names> </name><name name-style="western"><surname>Strudwick</surname><given-names>G</given-names> </name><etal/></person-group><article-title>The influence of electronic health record use on physician burnout: cross-sectional survey</article-title><source>J Med Internet Res</source><year>2020</year><month>07</month><day>15</day><volume>22</volume><issue>7</issue><fpage>e19274</fpage><pub-id pub-id-type="doi">10.2196/19274</pub-id><pub-id pub-id-type="medline">32673234</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group 
person-group-type="author"><name name-style="western"><surname>Gaffney</surname><given-names>A</given-names> </name><name name-style="western"><surname>Woolhandler</surname><given-names>S</given-names> </name><name name-style="western"><surname>Cai</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Medical documentation burden among US office-based physicians in 2019: a national study</article-title><source>JAMA Intern Med</source><year>2022</year><month>05</month><day>1</day><volume>182</volume><issue>5</issue><fpage>564</fpage><lpage>566</lpage><pub-id pub-id-type="doi">10.1001/jamainternmed.2022.0372</pub-id><pub-id pub-id-type="medline">35344006</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Haltaufderheide</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ranisch</surname><given-names>R</given-names> </name></person-group><article-title>The ethics of ChatGPT in medicine and healthcare: a systematic review on large language models (LLMs)</article-title><source>NPJ Digit Med</source><year>2024</year><month>07</month><day>8</day><volume>7</volume><issue>1</issue><fpage>183</fpage><pub-id pub-id-type="doi">10.1038/s41746-024-01157-x</pub-id><pub-id pub-id-type="medline">38977771</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bednarczyk</surname><given-names>L</given-names> </name><name name-style="western"><surname>Reichenpfader</surname><given-names>D</given-names> </name><name name-style="western"><surname>Gaudet-Blavignac</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Scientific evidence for clinical text summarization using large language models: scoping review</article-title><source>J Med Internet 
Res</source><year>2025</year><month>05</month><day>15</day><volume>27</volume><fpage>e68998</fpage><pub-id pub-id-type="doi">10.2196/68998</pub-id><pub-id pub-id-type="medline">40371947</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Van Veen</surname><given-names>D</given-names> </name><name name-style="western"><surname>Van Uden</surname><given-names>C</given-names> </name><name name-style="western"><surname>Blankemeier</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Adapted large language models can outperform medical experts in clinical text summarization</article-title><source>Nat Med</source><year>2024</year><month>04</month><volume>30</volume><issue>4</issue><fpage>1134</fpage><lpage>1142</lpage><pub-id pub-id-type="doi">10.1038/s41591-024-02855-5</pub-id><pub-id pub-id-type="medline">38413730</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Idnay</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Evaluating large language models on medical evidence summarization</article-title><source>NPJ Digit Med</source><year>2023</year><month>08</month><day>24</day><volume>6</volume><issue>1</issue><fpage>158</fpage><pub-id pub-id-type="doi">10.1038/s41746-023-00896-7</pub-id><pub-id pub-id-type="medline">37620423</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Barash</surname><given-names>Y</given-names> </name><name 
name-style="western"><surname>Klang</surname><given-names>E</given-names> </name><name name-style="western"><surname>Konen</surname><given-names>E</given-names> </name><name name-style="western"><surname>Sorin</surname><given-names>V</given-names> </name></person-group><article-title>ChatGPT-4 assistance in optimizing Emergency Department Radiology referrals and imaging selection</article-title><source>J Am Coll Radiol</source><year>2023</year><month>10</month><volume>20</volume><issue>10</issue><fpage>998</fpage><lpage>1003</lpage><pub-id pub-id-type="doi">10.1016/j.jacr.2023.06.009</pub-id><pub-id pub-id-type="medline">37423350</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tung</surname><given-names>JYM</given-names> </name><name name-style="western"><surname>Gill</surname><given-names>SR</given-names> </name><name name-style="western"><surname>Sng</surname><given-names>GGR</given-names> </name><etal/></person-group><article-title>Comparison of the quality of discharge letters written by large language models and junior clinicians: single-blinded study</article-title><source>J Med Internet Res</source><year>2024</year><month>07</month><day>24</day><volume>26</volume><fpage>e57721</fpage><pub-id pub-id-type="doi">10.2196/57721</pub-id><pub-id pub-id-type="medline">39047282</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>H</given-names> </name><name name-style="western"><surname>Jin</surname><given-names>HM</given-names> </name><name name-style="western"><surname>Jung</surname><given-names>YB</given-names> </name><name name-style="western"><surname>You</surname><given-names>SC</given-names> </name></person-group><article-title>Patient-friendly discharge summaries in Korea based on 
ChatGPT: software development and validation</article-title><source>J Korean Med Sci</source><year>2024</year><month>04</month><day>29</day><volume>39</volume><issue>16</issue><fpage>e148</fpage><pub-id pub-id-type="doi">10.3346/jkms.2024.39.e148</pub-id><pub-id pub-id-type="medline">38685890</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="web"><article-title>Guidelines for the standards on facilities and equipment required for the management and preservation of electronic medical records [Article in Korean]</article-title><source>Korea Health Information Service</source><year>2022</year><month>07</month><access-date>2025-04-30</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.k-his.or.kr/board.es?mid=a10306020000&#x0026;bid=0016&#x0026;list_no=614&#x0026;act=view">https://www.k-his.or.kr/board.es?mid=a10306020000&#x0026;bid=0016&#x0026;list_no=614&#x0026;act=view</ext-link></comment></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="web"><person-group person-group-type="author"><collab>OpenAI</collab></person-group><source>Introducing ChatGPT</source><year>2022</year><access-date>2025-04-30</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://openai.com/blog/chatgpt">https://openai.com/blog/chatgpt</ext-link></comment></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>K</given-names> </name><name name-style="western"><surname>Park</surname><given-names>S</given-names> </name><name name-style="western"><surname>Min</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Multifaceted natural language processing task-based evaluation of bidirectional encoder representations from transformers models for bilingual (Korean and English) clinical notes: algorithm development and 
validation</article-title><source>JMIR Med Inform</source><year>2024</year><month>10</month><day>30</day><volume>12</volume><fpage>e52897</fpage><pub-id pub-id-type="doi">10.2196/52897</pub-id><pub-id pub-id-type="medline">39475725</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="web"><article-title>Guidelines on the review and approval of generative artificial intelligence (AI)-based medical devices [Article in Korean]</article-title><source>Ministry of Food and Drug Safety (Republic of Korea)</source><year>2025</year><access-date>2025-07-09</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.mfds.go.kr/brd/m_1060/view.do?seq=15628">https://www.mfds.go.kr/brd/m_1060/view.do?seq=15628</ext-link></comment></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Goh</surname><given-names>E</given-names> </name><name name-style="western"><surname>Gallo</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Strong</surname><given-names>E</given-names> </name><etal/></person-group><article-title>GPT-4 assistance for improvement of physician performance on patient care tasks: a randomized controlled trial</article-title><source>Nat Med</source><year>2025</year><month>04</month><volume>31</volume><issue>4</issue><fpage>1233</fpage><lpage>1238</lpage><pub-id pub-id-type="doi">10.1038/s41591-024-03456-y</pub-id><pub-id pub-id-type="medline">39910272</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Perrin Franck</surname><given-names>C</given-names> </name><name name-style="western"><surname>Babington-Ashaye</surname><given-names>A</given-names> </name><name name-style="western"><surname>Dietrich</surname><given-names>D</given-names> 
</name><etal/></person-group><article-title>iCHECK-DH: Guidelines and Checklist for the Reporting on Digital Health Implementations</article-title><source>J Med Internet Res</source><year>2023</year><month>05</month><day>10</day><volume>25</volume><fpage>e46694</fpage><pub-id pub-id-type="doi">10.2196/46694</pub-id><pub-id pub-id-type="medline">37163336</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="web"><article-title>Saltlux Luxia2 model 8B</article-title><source>AWS Marketplace</source><access-date>2025-07-09</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://aws.amazon.com/marketplace/pp/prodview-p5ejp5ln5syam">https://aws.amazon.com/marketplace/pp/prodview-p5ejp5ln5syam</ext-link></comment></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Dubey</surname><given-names>A</given-names> </name><name name-style="western"><surname>Jauhri</surname><given-names>A</given-names> </name><name name-style="western"><surname>Pandey</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kadian</surname><given-names>A</given-names> </name><name name-style="western"><surname>Al-Dahle</surname><given-names>A</given-names> </name><name name-style="western"><surname>Letman</surname><given-names>A</given-names> </name><etal/></person-group><article-title>The Llama 3 herd of models</article-title><source>arXiv</source><comment>Preprint posted online on Nov 23, 2024</comment><pub-id pub-id-type="doi">10.48550/arXiv.2407.21783</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Cheng</surname><given-names>D</given-names> </name><name name-style="western"><surname>Gu</surname><given-names>Y</given-names> </name><name 
name-style="western"><surname>Huang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Bi</surname><given-names>J</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>M</given-names> </name><name name-style="western"><surname>Wei</surname><given-names>F</given-names> </name></person-group><article-title>Instruction pre-training: language models are supervised multitask learners</article-title><source>arXiv</source><comment>Preprint posted online on Nov 28, 2024</comment><pub-id pub-id-type="doi">10.48550/arXiv.2406.14491</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Jin</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Dhingra</surname><given-names>B</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Cohen</surname><given-names>WW</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>X</given-names> </name></person-group><article-title>PubMedQA: a dataset for biomedical research question answering</article-title><year>2019</year><month>09</month><day>13</day><conf-name>Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP)</conf-name><pub-id pub-id-type="doi">10.18653/v1/D19-1259</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Kweon</surname><given-names>S</given-names> </name><name name-style="western"><surname>Choi</surname><given-names>B</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>M</given-names> </name><name 
name-style="western"><surname>Park</surname><given-names>RW</given-names> </name><name name-style="western"><surname>Choi</surname><given-names>E</given-names> </name></person-group><article-title>KorMedMCQA: multi-choice question answering benchmark for Korean healthcare professional licensing examinations</article-title><source>arXiv</source><comment>Preprint posted online on Mar 5, 2024</comment><pub-id pub-id-type="doi">10.48550/arXiv.2403.01469</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Jin</surname><given-names>Q</given-names> </name></person-group><source>PubMedQA</source><access-date>2025-04-30</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://pubmedqa.github.io/">https://pubmedqa.github.io/</ext-link></comment></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="web"><source>HL7 FHIR release 4</source><access-date>2025-04-30</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://hl7.org/fhir/R4/index.html">https://hl7.org/fhir/R4/index.html</ext-link></comment></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="web"><article-title>Qiaojin/pubmedqa</article-title><source>Hugging Face</source><access-date>2025-07-09</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://huggingface.co/datasets/qiaojin/PubMedQA/">https://huggingface.co/datasets/qiaojin/PubMedQA/</ext-link></comment></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="web"><article-title>Sean0042/kormedmcqa</article-title><source>Hugging Face</source><access-date>2025-07-09</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://huggingface.co/datasets/sean0042/KorMedMCQA/">https://huggingface.co/datasets/sean0042/KorMedMCQA/</ext-link></comment></nlm-citation></ref><ref 
id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Kang</surname><given-names>HJ</given-names> </name><etal/></person-group><article-title>Fine-tuning LLMs with medical data: can safety be ensured?</article-title><source>NEJM AI</source><year>2025</year><month>01</month><volume>2</volume><issue>1</issue><fpage>AIcs2400390</fpage><pub-id pub-id-type="doi">10.1056/AIcs2400390</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>T</given-names> </name><name name-style="western"><surname>Ladhak</surname><given-names>F</given-names> </name><name name-style="western"><surname>Durmus</surname><given-names>E</given-names> </name><name name-style="western"><surname>Liang</surname><given-names>P</given-names> </name><name name-style="western"><surname>McKeown</surname><given-names>K</given-names> </name><name name-style="western"><surname>Hashimoto</surname><given-names>TB</given-names> </name></person-group><article-title>Benchmarking large language models for news summarization</article-title><source>Trans Assoc Comput Linguist</source><year>2024</year><month>01</month><day>31</day><volume>12</volume><fpage>39</fpage><lpage>57</lpage><pub-id pub-id-type="doi">10.1162/tacl_a_00632</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="report"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>J</given-names> </name><name name-style="western"><surname>Son</surname><given-names>K</given-names> </name><name name-style="western"><surname>Kang</surname><given-names>T</given-names> 
</name></person-group><article-title>A review of outpatient visit trends in Korea and other countries [Article in Korean]</article-title><year>2019</year><access-date>2025-10-22</access-date><publisher-name>Research Institute for Healthcare Policy, Korean Medical Association</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://rihp.re.kr/bbs/board.php?bo_table=research_report&#x0026;wr_id=293&#x0026;sst=wr_hit&#x0026;sod=asc&#x0026;sop=and&#x0026;page=17">https://rihp.re.kr/bbs/board.php?bo_table=research_report&#x0026;wr_id=293&#x0026;sst=wr_hit&#x0026;sod=asc&#x0026;sop=and&#x0026;page=17</ext-link></comment></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>CH</given-names> </name><name name-style="western"><surname>Lim</surname><given-names>H</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Park</surname><given-names>AH</given-names> </name><name name-style="western"><surname>Park</surname><given-names>EC</given-names> </name><name name-style="western"><surname>Kang</surname><given-names>JG</given-names> </name></person-group><article-title>Analysis of appropriate outpatient consultation time for clinical departments</article-title><source>HPM</source><year>2014</year><month>09</month><day>30</day><volume>24</volume><issue>3</issue><fpage>254</fpage><lpage>260</lpage><pub-id pub-id-type="doi">10.4332/KJHPA.2014.24.3.254</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Irving</surname><given-names>G</given-names> </name><name name-style="western"><surname>Neves</surname><given-names>AL</given-names> </name><name 
name-style="western"><surname>Dambha-Miller</surname><given-names>H</given-names> </name><etal/></person-group><article-title>International variations in primary care physician consultation time: a systematic review of 67 countries</article-title><source>BMJ Open</source><year>2017</year><month>11</month><day>8</day><volume>7</volume><issue>10</issue><fpage>e017902</fpage><pub-id pub-id-type="doi">10.1136/bmjopen-2017-017902</pub-id><pub-id pub-id-type="medline">29118053</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kwon</surname><given-names>A</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>HY</given-names> </name><name name-style="western"><surname>Shin</surname><given-names>SY</given-names> </name><etal/></person-group><article-title>Current health data standardization project and future directions to ensure interoperability in Korea</article-title><source>Healthc Inform Res</source><year>2024</year><month>04</month><volume>30</volume><issue>2</issue><fpage>93</fpage><lpage>102</lpage><pub-id pub-id-type="doi">10.4258/hir.2024.30.2.93</pub-id><pub-id pub-id-type="medline">38755100</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Preiksaitis</surname><given-names>C</given-names> </name><name name-style="western"><surname>Sinsky</surname><given-names>CA</given-names> </name><name name-style="western"><surname>Rose</surname><given-names>C</given-names> </name></person-group><article-title>ChatGPT is not the solution to physicians&#x2019; documentation burden</article-title><source>Nat Med</source><year>2023</year><month>06</month><volume>29</volume><issue>6</issue><fpage>1296</fpage><lpage>1297</lpage><pub-id pub-id-type="doi">10.1038/s41591-023-02341-4</pub-id><pub-id 
pub-id-type="medline">37169865</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Roberts</surname><given-names>K</given-names> </name></person-group><article-title>Large language models for reducing clinicians&#x2019; documentation burden</article-title><source>Nat Med</source><year>2024</year><month>04</month><volume>30</volume><issue>4</issue><fpage>942</fpage><lpage>943</lpage><pub-id pub-id-type="doi">10.1038/s41591-024-02888-w</pub-id><pub-id pub-id-type="medline">38561439</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Landman</surname><given-names>AB</given-names> </name><name name-style="western"><surname>Tilak</surname><given-names>SS</given-names> </name><name name-style="western"><surname>Walker</surname><given-names>GA</given-names> </name></person-group><article-title>Artificial intelligence-generated emergency department summaries and hospital handoffs</article-title><source>JAMA Netw Open</source><year>2024</year><month>12</month><day>2</day><volume>7</volume><issue>12</issue><fpage>e2448729</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2024.48729</pub-id><pub-id pub-id-type="medline">39625728</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Sahni</surname><given-names>N</given-names> </name><name name-style="western"><surname>Stein</surname><given-names>G</given-names> </name><name name-style="western"><surname>Zemmel</surname><given-names>R</given-names> </name><name name-style="western"><surname>Cutler</surname><given-names>DM</given-names> </name></person-group><source>The potential impact of artificial intelligence on healthcare 
spending</source><year>2023</year><access-date>2025-04-30</access-date><publisher-name>National Bureau of Economic Research Working Paper Series</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="http://www.nber.org/papers/w30857">http://www.nber.org/papers/w30857</ext-link></comment></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>TL</given-names> </name><name name-style="western"><surname>Hetherington</surname><given-names>TC</given-names> </name><name name-style="western"><surname>Dharod</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Does AI-Powered clinical documentation enhance clinician efficiency? A longitudinal study</article-title><source>NEJM AI</source><year>2024</year><month>11</month><day>27</day><volume>1</volume><issue>12</issue><fpage>AIoa2400659</fpage><pub-id pub-id-type="doi">10.1056/AIoa2400659</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Hyperparameter settings for model training.</p><media xlink:href="medinform_v13i1e76848_app1.docx" xlink:title="DOCX File, 24 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Untranslated examples of input data types and subsequent output contents of auto-generated drafts.</p><media xlink:href="medinform_v13i1e76848_app2.png" xlink:title="PNG File, 580 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Demonstration video for drafting emergency department discharge summaries using the Y-KNOT system.</p><media xlink:href="medinform_v13i1e76848_app3.mp4" xlink:title="MP4 File, 20085 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Demonstration video for drafting preanesthetic 
assessments using the Y-KNOT system.</p><media xlink:href="medinform_v13i1e76848_app4.mp4" xlink:title="MP4 File, 33625 KB"/></supplementary-material><supplementary-material id="app5"><label>Checklist 1</label><p>iCHECK-DH checklist.</p><media xlink:href="medinform_v13i1e76848_app5.docx" xlink:title="DOCX File, 43 KB"/></supplementary-material></app-group></back></article>