<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="letter" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v13i1e82057</article-id>
      <article-id pub-id-type="pmid">41021270</article-id>
      <article-id pub-id-type="doi">10.2196/82057</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Letter to the Editor</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Letter to the Editor</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Authors’ Reply: “Data Contamination in AI Evaluation”</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Iannaccio</surname>
            <given-names>Amanda</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Park</surname>
            <given-names>ChulHyoung</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0531-9144</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>An</surname>
            <given-names>Min Ho</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2773-9756</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Hwang</surname>
            <given-names>Gyubeom</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2293-4555</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Park</surname>
            <given-names>Rae Woong</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4989-3287</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>An</surname>
            <given-names>Juho</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <address>
            <institution>Department of Emergency Medicine</institution>
            <institution>School of Medicine</institution>
            <institution>Ajou University</institution>
            <addr-line>164 Worldcup-ro</addr-line>
            <addr-line>Yeongtong-gu</addr-line>
            <addr-line>Suwon, 16499</addr-line>
            <country>Republic of Korea</country>
            <phone>82 0312195016</phone>
            <email>ermd.jh@gmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7407-426X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Biomedical Informatics</institution>
        <institution>School of Medicine</institution>
        <institution>Ajou University</institution>
        <addr-line>Suwon</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Center for Biomedical Informatics Research</institution>
        <institution>Ajou University Medical Center</institution>
        <addr-line>Suwon</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Medical Sciences</institution>
        <institution>Graduate School of Ajou University</institution>
        <addr-line>Suwon</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>BK21 R&#38;E Initiative for Advanced Precision Medicine</institution>
        <addr-line>Suwon</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Emergency Medicine</institution>
        <institution>School of Medicine</institution>
        <institution>Ajou University</institution>
        <addr-line>Suwon</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Juho An <email>ermd.jh@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>29</day>
        <month>9</month>
        <year>2025</year>
      </pub-date>
      <volume>13</volume>
      <elocation-id>e82057</elocation-id>
      <history>
        <date date-type="received">
          <day>15</day>
          <month>8</month>
          <year>2025</year>
        </date>
        <date date-type="accepted">
          <day>20</day>
          <month>8</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©ChulHyoung Park, Min Ho An, Gyubeom Hwang, Rae Woong Park, Juho An. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 29.09.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2025/1/e82057" xlink:type="simple"/>
      <related-article related-article-type="commentary-article" id="v13i1e68409" ext-link-type="doi" xlink:href="10.2196/68409" vol="13" page="e68409" xlink:type="simple">https://medinform.jmir.org/2025/1/e68409/</related-article>
      <related-article related-article-type="commentary-article" id="v13i1e80987" ext-link-type="doi" xlink:href="10.2196/80987" vol="13" page="e80987" xlink:type="simple">https://medinform.jmir.org/2025/1/e80987/</related-article>
      <kwd-group>
        <kwd>artificial intelligence</kwd>
        <kwd>large language model</kwd>
        <kwd>ChatGPT</kwd>
        <kwd>emergency medicine</kwd>
        <kwd>clinical performance examination</kwd>
        <kwd>history taking</kwd>
        <kwd>clinical reasoning</kwd>
        <kwd>empathy</kwd>
        <kwd>patient experience</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <p>We sincerely thank the author for the constructive commentary on our recent publication. Our study evaluated ChatGPT’s performance across multiple dimensions—including history taking, diagnostic accuracy, communication skills, and empathic expression—through a clinical performance examination using simulated patients combined with written examinations [<xref ref-type="bibr" rid="ref1">1</xref>].</p>
    <p>In our study, the written examination was not intended to serve solely as a direct comparison of performance between ChatGPT and human physicians. Rather, it was included to support the interpretation of ChatGPT’s communication skills and empathic responses observed during simulated patient interactions by providing additional context regarding the model’s underlying clinical knowledge. A previous study has shown that patients may perceive ChatGPT’s responses as empathic or trustworthy, even when those responses are clinically inappropriate [<xref ref-type="bibr" rid="ref2">2</xref>]. However, effective clinical communication is not merely about verbal fluency or emotional tone; it must be grounded in adequate medical knowledge. For this reason, earlier studies evaluating artificial intelligence empathy have also assessed the clinical appropriateness of responses and compared them to those of human physicians [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>].</p>
    <p>Consistent with prior work, we also assessed the simulated patient conversations in terms of both clinical accuracy and empathic engagement, as evaluated by an emergency medicine professor. However, we recognize that physicians vary in their diagnostic styles and communication approaches. Subjective judgment from the evaluator may have influenced the ratings, especially given that the evaluated outputs were full conversations rather than single responses. To provide a complementary and more structured assessment, we incorporated a written test focused on 3 key domains: diagnosis, investigation, and treatment planning. Performance on this test may serve as a supporting element to help ensure that ChatGPT’s interpersonal strengths were not misaligned with clinical reasoning.</p>
    <p>As the author correctly pointed out, the questions in the written examination were adapted from a publicly available textbook published in 2018 [<xref ref-type="bibr" rid="ref4">4</xref>]. We cannot rule out the possibility that ChatGPT was exposed to this material or similar content during pretraining, due to the limited transparency regarding its training data. Therefore, part of the model’s performance on the written test may have been influenced by data contamination. We fully acknowledge this methodological limitation and agree that the results from the written examination should be interpreted with caution.</p>
    <p>We are truly grateful for the author’s thoughtful engagement, which raises important considerations for future studies regarding the assessment of artificial intelligence in clinical settings.</p>
  </body>
  <back>
    <app-group/>
    <ack>
      <p>During the preparation of this manuscript, the authors used ChatGPT to assist with improving readability and correcting grammatical errors. After using this tool, the authors reviewed and edited the content as needed and take full responsibility for the content of the publication.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>An</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Hwang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>An</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Clinical performance and communication skills of ChatGPT versus physicians in emergency medicine: simulated patient study</article-title>
          <source>JMIR Med Inform</source>
          <year>2025</year>
          <month>07</month>
          <day>17</day>
          <volume>13</volume>
          <fpage>e68409</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2025/1/e68409/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/68409</pub-id>
          <pub-id pub-id-type="medline">40674718</pub-id>
          <pub-id pub-id-type="pii">v13i1e68409</pub-id>
          <pub-id pub-id-type="pmcid">PMC12289221</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Armbruster</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bussmann</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Rothhaas</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Titze</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Grützner</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Freischmidt</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>“Doctor ChatGPT, can you help me?” The patient’s perspective: cross-sectional study</article-title>
          <source>J Med Internet Res</source>
          <year>2024</year>
          <month>10</month>
          <day>01</day>
          <volume>26</volume>
          <fpage>e58831</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2024/1/e58831/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/58831</pub-id>
          <pub-id pub-id-type="medline">39352738</pub-id>
          <pub-id pub-id-type="pii">v26i1e58831</pub-id>
          <pub-id pub-id-type="pmcid">PMC11480680</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ayers</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Poliak</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Leas</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Kelley</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Faix</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Goodman</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Longhurst</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Hogarth</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>Comparing physician and artificial intelligence chatbot responses to patient questions posted to a public social media forum</article-title>
          <source>JAMA Intern Med</source>
          <year>2023</year>
          <month>06</month>
          <day>01</day>
          <volume>183</volume>
          <issue>6</issue>
          <fpage>589</fpage>
          <lpage>596</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37115527"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamainternmed.2023.1838</pub-id>
          <pub-id pub-id-type="medline">37115527</pub-id>
          <pub-id pub-id-type="pii">2804309</pub-id>
          <pub-id pub-id-type="pmcid">PMC10148230</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shamil</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ravi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mistry</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <source>100 Cases in Emergency Medicine and Critical Care</source>
          <year>2018</year>
          <publisher-loc>Boca Raton, FL</publisher-loc>
          <publisher-name>CRC Press</publisher-name>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
