<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i11e29241</article-id>
      <article-id pub-id-type="pmid">34766919</article-id>
      <article-id pub-id-type="doi">10.2196/29241</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A Semiautomated Chart Review for Assessing the Development of Radiation Pneumonitis Using Natural Language Processing: Diagnostic Accuracy and Feasibility Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Hao</surname>
            <given-names>Tianyong</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Huang</surname>
            <given-names>Zhengxing</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Tang</surname>
            <given-names>Buzhou</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Gatti</surname>
            <given-names>Mauro</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Park</surname>
            <given-names>Hyungjun</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>McKenzie</surname>
            <given-names>Jordan</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6176-4352</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Rajapakshe</surname>
            <given-names>Rasika</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2149-7274</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Shen</surname>
            <given-names>Hua</given-names>
          </name>
          <degrees>MMath, PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5180-8670</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Rajapakshe</surname>
            <given-names>Shan</given-names>
          </name>
          <degrees>BSc, MSc</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3370-3231</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Lin</surname>
            <given-names>Angela</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <address>
            <institution>Radiation Oncology</institution>
            <institution>BC Cancer</institution>
            <addr-line>399 Royal Avenue</addr-line>
            <addr-line>Kelowna, BC, V1Y 5L3</addr-line>
            <country>Canada</country>
            <phone>1 250 712 3979</phone>
            <email>angela.lin@bccancer.bc.ca</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0611-539X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Northern Medical Program</institution>
        <institution>Faculty of Medicine</institution>
        <institution>University of British Columbia</institution>
        <addr-line>Prince George, BC</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Medical Physics</institution>
        <institution>BC Cancer</institution>
        <addr-line>Kelowna, BC</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Surgery</institution>
        <institution>Faculty of Medicine</institution>
        <institution>University of British Columbia</institution>
        <addr-line>Vancouver, BC</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Mathematics and Statistics</institution>
        <institution>University of Calgary</institution>
        <addr-line>Calgary, AB</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Island Medical Program</institution>
        <institution>Faculty of Medicine</institution>
        <institution>University of British Columbia</institution>
        <addr-line>Victoria, BC</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Radiation Oncology</institution>
        <institution>BC Cancer</institution>
        <addr-line>Kelowna, BC</addr-line>
        <country>Canada</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Angela Lin <email>angela.lin@bccancer.bc.ca</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>11</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>12</day>
        <month>11</month>
        <year>2021</year>
      </pub-date>
      <volume>9</volume>
      <issue>11</issue>
      <elocation-id>e29241</elocation-id>
      <history>
        <date date-type="received">
          <day>30</day>
          <month>3</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>19</day>
          <month>5</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>18</day>
          <month>6</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>5</day>
          <month>8</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Jordan McKenzie, Rasika Rajapakshe, Hua Shen, Shan Rajapakshe, Angela Lin. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 12.11.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2021/11/e29241" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Health research frequently requires manual chart reviews to identify patients in a study-specific cohort and examine their clinical outcomes. Manual chart review is a labor-intensive process that requires significant time investment for clinical researchers.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to evaluate the feasibility and accuracy of an assisted chart review program, using an in-house rule-based text-extraction program written in Python, to identify patients who developed radiation pneumonitis (RP) after receiving curative radiotherapy.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>A retrospective manual chart review was completed for patients who received curative radiotherapy for stage 2-3 lung cancer from January 1, 2013 to December 31, 2015, at British Columbia Cancer, Kelowna Centre. In the manual chart review, RP diagnosis and grading were recorded using the Common Terminology Criteria for Adverse Events version 5.0. From the charts of 50 sample patients, a total of 1413 clinical documents were obtained for review from the electronic medical record system. The text-extraction program was built using the Natural Language Toolkit Python platform (and regular expressions, also known as RegEx). Python version 3.7.2 was used to run the text-extraction program. The output of the text-extraction program was a list of the full sentences containing the key terms, document IDs, and dates from which these sentences were extracted. The results from the manual review were used as the gold standard in this study, with which the results of the text-extraction program were compared.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Fifty percent (25/50) of the sample patients developed grade ≥1 RP; the natural language processing program was able to ascertain 92% (23/25) of these patients (sensitivity 0.92, 95% CI 0.74-0.99; specificity 0.36, 95% CI 0.18-0.57). Furthermore, the text-extraction program was able to correctly identify all 9 patients with grade ≥2 RP, who are patients with clinically significant symptoms (sensitivity 1.0, 95% CI 0.66-1.0; specificity 0.27, 95% CI 0.14-0.43). The program was useful for distinguishing patients with RP from those without RP. The text-extraction program in this study avoided unnecessary manual review of 22% (11/50) of the sample patients, as these patients were identified as grade 0 RP and would not require further manual review in subsequent studies.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This feasibility study showed that the text-extraction program was able to assist with the identification of patients who developed RP after curative radiotherapy. The program streamlines the manual chart review further by identifying the key sentences of interest. This work has the potential to improve future clinical research, as the text-extraction program shows promise in performing chart review in a more time-efficient manner, compared with the traditional labor-intensive manual chart review.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>chart review</kwd>
        <kwd>natural language processing</kwd>
        <kwd>text extraction</kwd>
        <kwd>radiation pneumonitis</kwd>
        <kwd>lung cancer</kwd>
        <kwd>radiation therapy</kwd>
        <kwd>python</kwd>
        <kwd>electronic medical record</kwd>
        <kwd>accuracy</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Retrospective chart reviews require the analysis of pre-existing clinical data to answer a research question. To identify the patient cohort of interest, researchers often need to use certain inclusion criteria to scan a large <italic>database</italic>. After the patient cohort is identified, data abstraction begins, and a number of patient variables can be collected [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. For example, cancer research frequently uses chart reviews to examine the outcomes and specific side effects of therapies. Radiation pneumonitis (RP) is a potential side effect of radiation therapy (RT) in patients with lung cancer, which can lead to permanent lung damage visible on radiography (<xref rid="figure1" ref-type="fig">Figure 1</xref>) [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Patients with RP may develop supplemental oxygen dependence and have a lower quality of life; as such, it is an important outcome to consider after RT and important to understand factors that may increase or decrease the likelihood of its development [<xref ref-type="bibr" rid="ref4">4</xref>]. Of the patients with lung cancer treated with RT, it is expected that approximately 10% to 20% will develop moderate to severe RP [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. Although RP fatality is uncommon, it still occurs in 1.9% of those affected [<xref ref-type="bibr" rid="ref10">10</xref>]. For selecting a cohort of patients who developed symptomatic RP, the charts of patients with stage 2-3 lung cancer who received curative RT during the study period must be reviewed. In a typical manual chart review, this would involve researchers going through patient charts and looking for evidence and severity of RP diagnosis based on the Common Terminology Criteria for Adverse Events (CTCAE) version 5.0 [<xref ref-type="bibr" rid="ref9">9</xref>]. 
This process takes significant human resources and time to identify the patient cohort of interest [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. The time requirement is amplified in cohorts that have a small representation in the larger data set, where a much larger data set is necessary to be reviewed to find a significant number of rare events [<xref ref-type="bibr" rid="ref12">12</xref>]. This decreases the chart review productivity, where a high percentage of the chart review process will be unfruitful in identifying patients for the cohort and can be seen as a loss of valuable research time. Our goal is to use a computer program developed in-house to assist in the identification of the cohort of interest and move toward an automated chart review process.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Color wash of the dose distribution on a radiation therapy planning computed tomography for a patient with lung cancer (left). The blue edge represents the 20 gray dose line, which is the recognized dose associated with increased risk of radiation pneumonitis. The same patient’s 3-month follow-up computed tomography image showed opacity indicating a partial filling of the air spaces in the lungs. These radiologic changes are representative of radiation pneumonitis in the radiation field (right).</p>
          </caption>
          <graphic xlink:href="medinform_v9i11e29241_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>The most recent and sophisticated computer programs designed to assist in chart review studies have implemented natural language processing (NLP) [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. NLP is a computer model that can manipulate a document's narrative text and speech, also known as natural language, and export it in a structured format for analysis [<xref ref-type="bibr" rid="ref16">16</xref>]. This type of modeling is necessary because of the nature of electronic medical records (EMRs). Typically, patient charts in the EMR are written in a narrative text format, which is more difficult for a computer program to extract information from compared with a structured charting system that is arranged in tables [<xref ref-type="bibr" rid="ref17">17</xref>]. It has been estimated that up to 80% of health care data are in an unstructured narrative format within most EMR systems [<xref ref-type="bibr" rid="ref18">18</xref>]. Using an NLP computer algorithm as a tool could enable a chart review to be completed in less time with fewer human resources.</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>The objective of this study is to evaluate the feasibility and accuracy of an in-house developed rule-based text-extraction program written in Python to identify patients with lung cancer who developed RP after receiving curative RT. This rule-based text-extraction program written in Python is the first stage of developing a more robust NLP program. RP is an important factor to consider with respect to RT and serves as a marker for treatment-specific variables and allows us to evaluate the use of the text-extraction program. Specifically, the focus of identification in this study is on clinically significant cases of grade ≥2 RP. RP is graded by severity; if the patient’s quality of life is affected by shortness of breath and cough, it is grade ≥2, whereas grade 1 RP is only seen on imaging and is not associated with any symptoms (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>) [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
        <boxed-text id="box1" position="float">
          <title>Radiation pneumonitis (RP) grading based on Common Terminology Criteria for Adverse Events version 5.0.</title>
          <p>
            <bold>Grade 0</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>No RP present</p>
            </list-item>
          </list>
          <p>
            <bold>Grade 1</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>Asymptomatic; clinical or diagnostic observations only; intervention not indicated</p>
            </list-item>
          </list>
          <p>
            <bold>Grade 2</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>Symptomatic; medical intervention indicated; limiting instrumental activities of daily living</p>
            </list-item>
          </list>
          <p>
            <bold>Grade 3</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>Severe symptoms; limiting self-care activities of daily living; oxygen indicated</p>
            </list-item>
          </list>
          <p>
            <bold>Grade 4</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>Life-threatening respiratory compromise; urgent intervention indicated (eg, tracheotomy or intubation)</p>
            </list-item>
          </list>
          <p>
            <bold>Grade 5</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>Death</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Recruitment</title>
        <p>The study population included a sample subset of 50 patients, from those who received curative RT for stage 2-3 non–small cell lung cancer from January 1, 2013, to December 31, 2015, at British Columbia (BC) Cancer Kelowna. The sample subset was designed to represent the proportions of RP grades in the literature [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. However, there is a lack of consensus on the proportions of RP grades among patients treated with RT, most likely because of the numerous variables identified in contributing to RP development, including age, RT dose, concurrent chemotherapy, and underlying comorbidities such as chronic obstructive pulmonary disease [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. The sample subset represents the proportion of RP grades most likely to be encountered in a larger randomized data set. Once the proportions of RP grade were decided on for the cohort based on the literature, simple random sampling without replacement was done on the manually reviewed cohort.</p>
      </sec>
      <sec>
        <title>Data Exclusion</title>
        <p>Patients who underwent surgery after radiation treatment were excluded. Patients who received palliative radiation and patients with small cell lung cancer were excluded.</p>
      </sec>
      <sec>
        <title>Workflow</title>
        <p>A manual chart review was completed by reviewing patient charts from the institutional EMR at BC Cancer Kelowna. The manual chart review results served as the definitive diagnosis, with which the assisted chart review program was compared. In the manual chart review, RP diagnosis and grading were recorded using CTCAE version 5.0 (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>) [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
        <p>The in-house text-extraction program was built using the Natural Language Toolkit Python platform (and regular expressions, also known as RegEx). Patient charts were extracted from the BC Cancer EMR system and were subsequently formatted into the American Standard Code for Information Interchange text files to be compatible with the text-extraction program. From the charts of 50 sample patients, a total of 1413 clinical documents (clinical notes and radiology reports) were obtained for review. The reports from the BC Cancer EMR system were obtained by either direct conversion to text format documents or were printed in PDF and then converted to text format using the open-source Python Tesseract optical character recognition program. This step of obtaining and converting the documents to text format from the BC Cancer EMR system was necessary, as the text-extraction program input requires text format documents. Python version 3.7.2 was used to run the assisted chart review text-extraction program. The terms <italic>pneumonitis</italic>, <italic>radiation pneumonitis</italic>, <italic>radiation induced lung injury</italic>, and <italic>fibrosis</italic> were used as key terms for the assisted chart review. These key terms were chosen by the radiation oncologist contributing clinical expertise in this study, and they represent terminology that a physician would use to identify RP in dictated reports. The output of the text-extraction program was a list of full sentences containing the key terms, along with the document IDs and dates from which these sentences were extracted. The text-extraction program was designed to search through all the charts and extract the whole sentence that contained the key terms. If a sentence was extracted from a patient’s chart, the patient was identified as having RP. The text-extraction program organized the extracted information, identified the patients, and indicated the exact documents containing the key terms. 
The results from the text-extraction program were then compared with those from the manual chart review.</p>
        <p>If the text-extraction program is shown to be feasible and accurate, a more expedited manual chart review can be performed using the results of the text-extraction program in future studies. Patients with no key terms identified in their charts will be designated as grade 0 RP, and no further chart review of these patients will need to be completed. For the patients identified by the text-extraction program to have RP, the sentences containing the key terms can be reviewed manually, first to confirm that these patients are correctly identified as having RP, and then to grade the RP severity in an expedited manner. Thus, there is an opportunity to improve the text-extraction program specificity during this sentence review process by correcting the false-positive cases.</p>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <p>The comparison between the manual chart review and text-extraction program output was viewed and analyzed in 2 different ways: the first approach considered the diseased state to be grade ≥1 RP, and the second approach considered the diseased state to be grade ≥2 RP, with grade 1 RP classified as a healthy state as the patients with grade 1 RP had no clinical symptoms. The text-extraction program was designed to look for any grade of RP when searching through the patient charts, so this lends itself to being able to perform well during the first analysis. However, grade 1 RP is only visible radiographically and thus is not clinically relevant to a patient’s further care. Thus, we wanted to look at how well the assisted chart review system was able to identify patients with symptomatic RP. Statistical analyses were performed using SAS software version 9.4.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Text-Extraction Program Output</title>
        <p>The results of the text-extraction program used to identify patients with RP of any grade are shown in <xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref>. The text-extraction program was able to ascertain 92% (23/25) of patients who developed grade ≥1 RP (sensitivity 0.92, 95% CI 0.74-0.99; specificity 0.36, 95% CI 0.18-0.57). The results of the text-extraction program used to identify patients with symptomatic RP, that is, grade ≥2, are shown in <xref ref-type="table" rid="table3">Table 3</xref>. The text-extraction program was able to correctly identify all 9 patients with grade ≥2 RP (sensitivity 1.0, 95% CI 0.66-1.0; specificity 0.27, 95% CI 0.14-0.43). Both analyses revealed that the text-extraction program was capable of significantly differentiating between the diseased and healthy groups.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>The assisted chart review text-extraction program results and the accuracy for each RP grade.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="330"/>
            <col width="290"/>
            <col width="380"/>
            <thead>
              <tr valign="top">
                <td>RP severity (grade)</td>
                <td>Total, N</td>
                <td>Correctly identified, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>0</td>
                <td>25</td>
                <td>9 (36)</td>
              </tr>
              <tr valign="top">
                <td>1</td>
                <td>16</td>
                <td>14 (88)</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>7</td>
                <td>7 (100)</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>2</td>
                <td>2 (100)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>The assisted chart review text-extraction program results for differentiating between patients with radiation pneumonitis (RP) of grade 0 (healthy) versus those with RP of grade ≥1 (diseased).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="320"/>
            <col width="230"/>
            <col width="280"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td>Text-extraction program findings</td>
                <td colspan="3">Manual chart review finding</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Healthy (grade 0 RP), n (%)</td>
                <td>Diseased (grade ≥1 RP), n (%)</td>
                <td>Total, N</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Healthy (grade 0 RP)</td>
                <td>9 (18)</td>
                <td>2 (4)</td>
                <td>11</td>
              </tr>
              <tr valign="top">
                <td>Diseased (grade ≥1 RP)</td>
                <td>16 (32)</td>
                <td>23 (46)</td>
                <td>39</td>
              </tr>
              <tr valign="top">
                <td>Total</td>
                <td>25 (50)</td>
                <td>25 (50)</td>
                <td>50</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>The assisted chart review text-extraction program results looking at the ability to distinguish between patients with radiation pneumonitis (RP) of grade ≤1 (healthy) and those with RP of grade ≥2 (diseased).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="320"/>
            <col width="260"/>
            <col width="280"/>
            <col width="140"/>
            <thead>
              <tr valign="top">
                <td>Text-extraction program findings</td>
                <td colspan="3">Manual chart review finding</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Healthy (grade ≤1 RP), n (%)</td>
                <td>Diseased (grade ≥2 RP), n (%)</td>
                <td>Total, N</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Healthy (grade ≤1 RP)</td>
                <td>11 (22)</td>
                <td>0 (0)</td>
                <td>11</td>
              </tr>
              <tr valign="top">
                <td>Diseased (grade ≥2 RP)</td>
                <td>30 (60)</td>
                <td>9 (18)</td>
                <td>39</td>
              </tr>
              <tr valign="top">
                <td>Total</td>
                <td>41 (82)</td>
                <td>9 (18)</td>
                <td>50</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>The text-extraction program missed 2 patients with grade 1 RP. Upon further review, the 2 patients with grade 1 RP that the text-extraction program <italic>missed</italic> were found to truly have grade 0 RP but were incorrectly labeled as patients with RP because of human error in the manual chart review. If we correct for this human error, the sensitivity improves to 1.0 for the text-extraction program’s ability to identify grade ≥1 RP.</p>
      </sec>
      <sec>
        <title>Clinical Utility</title>
        <p>In our cohort, each patient’s chart consisted of an average of 28 clinical documents, with a range of 15 to 150 documents. The average time spent during the manual chart review of one patient’s chart was 30 minutes. Therefore, the manual chart review of the 50-patient cohort took 25 hours. In comparison, the assisted chart review text-extraction program processed the 1413 clinical documents and exported the results in &#60;5 minutes.</p>
        <p>The use of the text-extraction program in this study would be to avoid unnecessary manual review of 22% (11/50) of the sample, including their electronic documents (198/1413, 14%), as these patients were identified as not having RP and thus would not require any manual review. It will also streamline the rest of the manual review as key sentences with the key terms are identified, thus further reducing the number of clinical documents necessary for the manual review to confirm that the patient should be included in the cohort.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The text-extraction program was able to identify patients with RP with high sensitivity but, unfortunately, low specificity. This can assist in the identification of a patient cohort of interest in a more efficient manner.</p>
        <p>The text-extraction program correctly identified 2 patients with grade 0 RP whom the manual chart review had incorrectly labeled as having RP. Similar findings have been reported in the literature, where one study found that their automated chart review outperformed their manual chart review as the human reviewer missed the correct classification on manual evaluation of the chart [<xref ref-type="bibr" rid="ref11">11</xref>]. Therefore, although the gold standard for assessing the accuracy of the text-extraction program in this study is manual chart review, the process is very tedious and not guaranteed to be perfect because of human error [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. This highlights a potential advantage of the text-extraction program in being more accurate than the human-led manual chart review.</p>
        <p>The utility of the text-extraction program in this study would be to perform a rapid scan of a larger data set of documents and avoid unnecessary manual review of many of the non-RP patient charts. The program is able to use key terms, such as RP or fibrosis, to return a list of patients with those terms in the patient charts. This will significantly cut down on the number of charts that the manual review will include. This is mainly because, even if a patient does develop RP, most of their charts do not include any indication of their diagnosis. The computer program organizes the extracted information by patient and by exact chart, thus further reducing the amount of manual chart review that is necessary to confirm that the patient should be included in our cohort.</p>
        <p>The end goal of using text-extraction programs to perform chart reviews is to save the researcher time and effort of combing through patient charts to form a cohort in which to begin studying a clinical outcome. Our text-extraction program was able to output its results in &#60;5 minutes compared with the 25 hours it took the manual chart review control to create the RP cohort.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>A limitation to implementing this assisted chart review program is its current high false-positive rate, leading to unnecessary chart review of patients with no RP. The development of automated chart reviews must consider the balance between NLP program accuracy (no diseased cases missed) and the amount of time saved by confidently eliminating true RP grade 0 patients in the review. Designing the key terms was an important process to balance the accuracy of the text-extraction program against the time saved using the text-extraction program. Selecting broad key terms is important to capture all patients who may fall into our cohort; however, more specific key terms would better rule out patients not within the study cohort. Our goal was to maximize the sensitivity of the text-extraction program by including broad terms so as to not miss any patients with the diseased state initially, as the sentence output of the text-extraction program allows for a truncated chart review to improve the specificity. This means that the possible time saved in this feasibility study was reduced because more false-positive RP patients were identified. Future work is underway to improve the specificity of the text-extraction program with a larger sample.</p>
        <p>Another limitation of our work is the small sample size of 50 patients. This sample group was used as a proof of concept for our in-house developed text-extraction program. This study’s results will guide further refinement of the text-extraction program and validation with a larger sample of patients.</p>
        <p>The rule-based text-extraction program used in this study still requires human involvement in a number of steps. The clinical documents in the BC Cancer EMR system had to be obtained manually rather than automatically, which continues to pose a barrier in making chart review research as time efficient as possible.</p>
        <p>In addition, it is important to point out that expert opinions were necessary to identify the key terms to be used in the text-extraction program. This is not only another human involvement requirement but also indicates that the results are dependent on the quality of the expert. In addition, this makes the program less generalizable to other cohorts without a new expert to create the proper key terms for each specific cohort.</p>
      </sec>
      <sec>
        <title>Comparison With Previous Work</title>
        <p>Other studies have used NLP programs to assist with chart reviews in many scopes of medicine, including respirology, cardiology, and neurosurgery, and now our cancer research to identify patients who developed RP [<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref24">24</xref>]. NLP has different applications in medical research, such as identifying patient cohorts, as in our study and in similar studies that identified cohorts of patients with progressive heart failure and patients with asthma [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. Other studies have used NLP programs to extract specific clinical features from clinical charts, such as tuberculosis patient factors and radiology characteristics of glioblastoma [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. Our use of an NLP program to extract information based on key terms to reduce the amount of chart review necessary is similar to the study by Cao et al [<xref ref-type="bibr" rid="ref25">25</xref>], where they used search terms to identify medical errors through patient charts. This allowed their group to reduce the number of charts that needed to be reviewed, from 286,000 discharge summaries to 2744 discharge summaries that were found to contain the search terms [<xref ref-type="bibr" rid="ref25">25</xref>]. This meant that the Cao et al [<xref ref-type="bibr" rid="ref25">25</xref>] manual review only had to be done on &#60;1% of the initial data set. Reducing the number of charts to review saves many hours of manual chart review and would greatly increase the speed at which the review could be completed. Thus, an assisted chart review program opens the possibility of expanding the study to include a much larger data set that would be impractical to review manually. Our study adds to the existing literature on this topic by supporting the validity of NLP programs; it demonstrates the ability to further analyze an identified patient cohort based on variables of interest, such as illness severity.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In conclusion, the NLP-based text-extraction program used in this study is a feasible and valuable method for identifying patients who developed RP after curative radiotherapy. First, the text-extraction program helped save chart review time by completely eliminating patient charts identified with grade 0 RP. Second, the text-extraction program extracted key sentences from patient charts and allowed for an efficient review of relevant phrases, should this be needed to grade patients’ RP severity without having to peruse the rest of their charts. For example, in a quick scan, a researcher would be able to read only the sentences with the identified keyword in a patient’s chart instead of sifting through many full documents.</p>
        <p>The analysis revealed that the text-extraction program was capable of significantly differentiating between diseased and healthy groups. Compared with the manual chart review of the 50-patient cohort that took 25 hours, the text-extraction program was able to process all the charts in &#60;5 minutes and exported the list of patients that had RP mentioned somewhere in their chart.</p>
        <p>This work has the potential to improve future clinical research as the text-extraction program shows promise in performing chart review in a more time- and effort-efficient manner compared with the traditional manual chart review. The text-extraction program is available by contacting the authors (RR).</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">BC</term>
          <def>
            <p>British Columbia</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CTCAE</term>
          <def>
            <p>Common Terminology Criteria for Adverse Events</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">EMR</term>
          <def>
            <p>electronic medical record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">RP</term>
          <def>
            <p>radiation pneumonitis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">RT</term>
          <def>
            <p>radiation therapy</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study received funding support from the British Columbia Cancer Foundation and the University of British Columbia Faculty of Medicine. The authors thank Jinying Wu for statistical analysis support.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Worster</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haines</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Advanced statistics: understanding medical record review (MRR) studies</article-title>
          <source>Acad Emerg Med</source>
          <year>2004</year>
          <month>02</month>
          <volume>11</volume>
          <issue>2</issue>
          <fpage>187</fpage>
          <lpage>92</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/resolve/openurl?genre=article&#38;sid=nlm:pubmed&#38;issn=1069-6563&#38;date=2004&#38;volume=11&#38;issue=2&#38;spage=187"/>
          </comment>
          <pub-id pub-id-type="medline">14759964</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Panacek</surname>
              <given-names>EA</given-names>
            </name>
          </person-group>
          <article-title>Performing chart review studies</article-title>
          <source>Air Med J</source>
          <year>2007</year>
          <volume>26</volume>
          <issue>5</issue>
          <fpage>206</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.1016/j.amj.2007.06.007</pub-id>
          <pub-id pub-id-type="medline">17765825</pub-id>
          <pub-id pub-id-type="pii">S1067-991X(07)00160-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gearing</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Mian</surname>
              <given-names>IA</given-names>
            </name>
            <name name-style="western">
              <surname>Barber</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ickowicz</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A methodology for conducting retrospective chart review research in child and adolescent psychiatry</article-title>
          <source>J Can Acad Child Adolesc Psychiatry</source>
          <year>2006</year>
          <month>08</month>
          <volume>15</volume>
          <issue>3</issue>
          <fpage>126</fpage>
          <lpage>34</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18392182"/>
          </comment>
          <pub-id pub-id-type="medline">18392182</pub-id>
          <pub-id pub-id-type="pmcid">PMC2277255</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weytjens</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Erven</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>De Ruysscher</surname>
              <given-names>RD</given-names>
            </name>
          </person-group>
          <article-title>Radiation pneumonitis: occurrence, prediction, prevention and treatment</article-title>
          <source>Belg J Med Oncol</source>
          <year>2013</year>
          <month>9</month>
          <volume>7</volume>
          <issue>4</issue>
          <fpage>105</fpage>
          <lpage>10</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ariez.nl/wp-content/uploads/2018/08/105-10-1.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kainthola</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haritwal</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tiwari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Parvez</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tiwari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Prakash</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Agrawala</surname>
              <given-names>PK</given-names>
            </name>
          </person-group>
          <article-title>Immunological aspect of radiation-induced pneumonitis, current treatment strategies, and future prospects</article-title>
          <source>Front Immunol</source>
          <year>2017</year>
          <month>5</month>
          <day>2</day>
          <volume>8</volume>
          <fpage>506</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fimmu.2017.00506"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fimmu.2017.00506</pub-id>
          <pub-id pub-id-type="medline">28512460</pub-id>
          <pub-id pub-id-type="pmcid">PMC5411429</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tian</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Dosiomics: extracting 3D spatial features from dose distribution to predict incidence of radiation pneumonitis</article-title>
          <source>Front Oncol</source>
          <year>2019</year>
          <month>4</month>
          <day>12</day>
          <volume>9</volume>
          <fpage>269</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fonc.2019.00269"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fonc.2019.00269</pub-id>
          <pub-id pub-id-type="medline">31032229</pub-id>
          <pub-id pub-id-type="pmcid">PMC6473398</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moreno</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Aristu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ramos</surname>
              <given-names>LI</given-names>
            </name>
            <name name-style="western">
              <surname>Arbea</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>López-Picazo</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Cambeiro</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Martínez-Monge</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Predictive factors for radiation-induced pulmonary toxicity after three-dimensional conformal chemoradiation in locally advanced non-small-cell lung cancer</article-title>
          <source>Clin Transl Oncol</source>
          <year>2007</year>
          <month>09</month>
          <volume>9</volume>
          <issue>9</issue>
          <fpage>596</fpage>
          <lpage>602</lpage>
          <pub-id pub-id-type="doi">10.1007/s12094-007-0109-1</pub-id>
          <pub-id pub-id-type="medline">17921108</pub-id>
          <pub-id pub-id-type="pii">1084</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Anthony</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Cunliffe</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Castillo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Pham</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Guerrero</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Armato</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Hallaq</surname>
              <given-names>HA</given-names>
            </name>
          </person-group>
          <article-title>Incorporation of pre-therapy <sup>18</sup>F-FDG uptake data with CT texture features into a radiomics model for radiation pneumonitis diagnosis</article-title>
          <source>Med Phys</source>
          <year>2017</year>
          <month>07</month>
          <volume>44</volume>
          <issue>7</issue>
          <fpage>3686</fpage>
          <lpage>94</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28422299"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/mp.12282</pub-id>
          <pub-id pub-id-type="medline">28422299</pub-id>
          <pub-id pub-id-type="pmcid">PMC5503160</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="web">
          <article-title>Common Terminology Criteria for Adverse Events (CTCAE) Version 5.0</article-title>
          <source>NIH National Cancer Institute</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ctep.cancer.gov/protocolDevelopment/electronic_applications/ctc.htm#ctc_50">https://ctep.cancer.gov/protocolDevelopment/electronic_applications/ctc.htm#ctc_50</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Palma</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Senan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tsujino</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Barriger</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Rengan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Moreno</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bradley</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Ramella</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Marks</surname>
              <given-names>LB</given-names>
            </name>
            <name name-style="western">
              <surname>De Petris</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Stitt</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Rodrigues</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Predicting radiation pneumonitis after chemoradiation therapy for lung cancer: an international individual patient data meta-analysis</article-title>
          <source>Int J Radiat Oncol Biol Phys</source>
          <year>2013</year>
          <month>02</month>
          <day>01</day>
          <volume>85</volume>
          <issue>2</issue>
          <fpage>444</fpage>
          <lpage>50</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22682812"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijrobp.2012.04.043</pub-id>
          <pub-id pub-id-type="medline">22682812</pub-id>
          <pub-id pub-id-type="pii">S0360-3016(12)00640-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC3448004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Duz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Marshall</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Parkin</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Validation of an improved computer-assisted technique for mining free-text electronic medical records</article-title>
          <source>JMIR Med Inform</source>
          <year>2017</year>
          <month>06</month>
          <day>29</day>
          <volume>5</volume>
          <issue>2</issue>
          <fpage>e17</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2017/2/e17/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/medinform.7123</pub-id>
          <pub-id pub-id-type="medline">28663163</pub-id>
          <pub-id pub-id-type="pii">v5i2e17</pub-id>
          <pub-id pub-id-type="pmcid">PMC5509949</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dipaola</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Gatti</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pacetti</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Bottaccioli</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Shiffer</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Minonzio</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Menè</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Giaj Levra</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Solbiati</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Costantino</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Anastasio</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sini</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Barbic</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Brunetta</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Furlan</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence algorithms and natural language processing for the recognition of syncope patients on emergency department medical records</article-title>
          <source>J Clin Med</source>
          <year>2019</year>
          <month>10</month>
          <day>14</day>
          <volume>8</volume>
          <issue>10</issue>
          <fpage>1677</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=jcm8101677"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/jcm8101677</pub-id>
          <pub-id pub-id-type="medline">31614982</pub-id>
          <pub-id pub-id-type="pii">jcm8101677</pub-id>
          <pub-id pub-id-type="pmcid">PMC6832155</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hardjojo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gunachandran</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Abdullah</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Wah</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Chong</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Goh</surname>
              <given-names>EH</given-names>
            </name>
            <name name-style="western">
              <surname>Teo</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>MI</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Phang</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Validation of a natural language processing algorithm for detecting infectious disease symptoms in primary care electronic medical records in Singapore</article-title>
          <source>JMIR Med Inform</source>
          <year>2018</year>
          <month>06</month>
          <day>11</day>
          <volume>6</volume>
          <issue>2</issue>
          <fpage>e36</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2018/2/e36/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/medinform.8204</pub-id>
          <pub-id pub-id-type="medline">29907560</pub-id>
          <pub-id pub-id-type="pii">v6i2e36</pub-id>
          <pub-id pub-id-type="pmcid">PMC6026305</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Suominen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gedeon</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Adapting state-of-the-art deep language models to clinical information extraction systems: potentials, challenges, and solutions</article-title>
          <source>JMIR Med Inform</source>
          <year>2019</year>
          <month>04</month>
          <day>25</day>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>e11499</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2019/2/e11499/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/11499</pub-id>
          <pub-id pub-id-type="medline">31021325</pub-id>
          <pub-id pub-id-type="pii">v7i2e11499</pub-id>
          <pub-id pub-id-type="pmcid">PMC6658232</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jabbour</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>O'Reilly</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yue</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Automated information extraction on treatment and prognosis for non-small cell lung cancer radiotherapy patients: clinical study</article-title>
          <source>JMIR Med Inform</source>
          <year>2018</year>
          <month>02</month>
          <day>01</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>e8</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2018/1/e8/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/medinform.8662</pub-id>
          <pub-id pub-id-type="medline">29391345</pub-id>
          <pub-id pub-id-type="pii">v6i1e8</pub-id>
          <pub-id pub-id-type="pmcid">PMC5814605</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Usui</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Aramaki</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Iwao</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wakamiya</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sakamoto</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mochizuki</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Extraction and standardization of patient complaints from electronic medication histories for pharmacovigilance: natural language processing analysis in Japanese</article-title>
          <source>JMIR Med Inform</source>
          <year>2018</year>
          <month>09</month>
          <day>27</day>
          <volume>6</volume>
          <issue>3</issue>
          <fpage>e11021</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2018/3/e11021/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/11021</pub-id>
          <pub-id pub-id-type="medline">30262450</pub-id>
          <pub-id pub-id-type="pii">v6i3e11021</pub-id>
          <pub-id pub-id-type="pmcid">PMC6231790</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tignanelli</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Silverman</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Lindemann</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Trembley</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Gipson</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Beilman</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Lyng</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Finzel</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>McEwan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Knoll</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Pakhomov</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Melton</surname>
              <given-names>GB</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing of prehospital emergency medical services trauma records allows for automated characterization of treatment appropriateness</article-title>
          <source>J Trauma Acute Care Surg</source>
          <year>2020</year>
          <month>05</month>
          <volume>88</volume>
          <issue>5</issue>
          <fpage>607</fpage>
          <lpage>14</lpage>
          <pub-id pub-id-type="doi">10.1097/TA.0000000000002598</pub-id>
          <pub-id pub-id-type="medline">31977990</pub-id>
          <pub-id pub-id-type="pii">01586154-202005000-00004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Juhn</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence approaches using natural language processing to advance EHR-based clinical research</article-title>
          <source>J Allergy Clin Immunol</source>
          <year>2020</year>
          <month>02</month>
          <volume>145</volume>
          <issue>2</issue>
          <fpage>463</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31883846"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jaci.2019.12.897</pub-id>
          <pub-id pub-id-type="medline">31883846</pub-id>
          <pub-id pub-id-type="pii">S0091-6749(19)32604-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7771189</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Inoue</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kunitoh</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Sekine</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Sumi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tokuuye</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Saijo</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Radiation pneumonitis in lung cancer patients: a retrospective study of risk factors and the long-term prognosis</article-title>
          <source>Int J Radiat Oncol Biol Phys</source>
          <year>2001</year>
          <month>03</month>
          <day>01</day>
          <volume>49</volume>
          <issue>3</issue>
          <fpage>649</fpage>
          <lpage>55</lpage>
          <pub-id pub-id-type="doi">10.1016/s0360-3016(00)00783-5</pub-id>
          <pub-id pub-id-type="medline">11172945</pub-id>
          <pub-id pub-id-type="pii">S0360-3016(00)00783-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Beers</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yau</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Chauhan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Duffy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chaudhary</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Debnath</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Saha</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pattharanitima</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kotanko</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Federman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Coca</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Van Vleck</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Nadkarni</surname>
              <given-names>GN</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing of electronic health records is superior to billing codes to identify symptom burden in hemodialysis patients</article-title>
          <source>Kidney Int</source>
          <year>2020</year>
          <month>02</month>
          <volume>97</volume>
          <issue>2</issue>
          <fpage>383</fpage>
          <lpage>92</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31883805"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.kint.2019.10.023</pub-id>
          <pub-id pub-id-type="medline">31883805</pub-id>
          <pub-id pub-id-type="pii">S0085-2538(19)31116-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC7001114</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaur</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ryu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Bachman</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kita</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Croghan</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Castro-Rodriguez</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Voge</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Juhn</surname>
              <given-names>YJ</given-names>
            </name>
          </person-group>
          <article-title>Automated chart review utilizing natural language processing algorithm for asthma predictive index</article-title>
          <source>BMC Pulm Med</source>
          <year>2018</year>
          <month>02</month>
          <day>13</day>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>34</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpulmmed.biomedcentral.com/articles/10.1186/s12890-018-0593-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12890-018-0593-9</pub-id>
          <pub-id pub-id-type="medline">29439692</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12890-018-0593-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC5812028</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lindvall</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Forsyth</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Barzilay</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tulsky</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing: an opportunity to make chart data come alive in palliative care research (FR481A)</article-title>
          <source>J Pain Symptom Manage</source>
          <year>2017</year>
          <month>02</month>
          <day>01</day>
          <volume>53</volume>
          <issue>2</issue>
          <fpage>385</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/J.JPAINSYMMAN.2016.12.164"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jpainsymman.2016.12.164</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Petch</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Batt</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Murray</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mamdani</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Extracting clinical features from dictated ambulatory consult notes using a commercially available natural language processing tool: pilot, retrospective, cross-sectional validation study</article-title>
          <source>JMIR Med Inform</source>
          <year>2019</year>
          <month>11</month>
          <day>01</day>
          <volume>7</volume>
          <issue>4</issue>
          <fpage>e12575</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2019/4/e12575/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12575</pub-id>
          <pub-id pub-id-type="medline">31682579</pub-id>
          <pub-id pub-id-type="pii">v7i4e12575</pub-id>
          <pub-id pub-id-type="pmcid">PMC6913750</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Senders</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>LD</given-names>
            </name>
            <name name-style="western">
              <surname>Calvachi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>McNulty</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ashby</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Schulte</surname>
              <given-names>IS</given-names>
            </name>
            <name name-style="western">
              <surname>Almekkawi</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Mehrtash</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gormley</surname>
              <given-names>WB</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Broekman</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Arnaout</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Automating clinical chart review: an open-source natural language processing pipeline developed on free-text radiology reports from patients with glioblastoma</article-title>
          <source>JCO Clin Cancer Inform</source>
          <year>2020</year>
          <month>01</month>
          <volume>4</volume>
          <fpage>25</fpage>
          <lpage>34</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ascopubs.org/doi/10.1200/CCI.19.00060?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub%3dpubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1200/CCI.19.00060</pub-id>
          <pub-id pub-id-type="medline">31977252</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Stetson</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Assessing explicit error reporting in the narrative electronic medical record using keyword searching</article-title>
          <source>J Biomed Inform</source>
          <year>2003</year>
          <volume>36</volume>
          <issue>1-2</issue>
          <fpage>99</fpage>
          <lpage>105</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532046403000583"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/s1532-0464(03)00058-3</pub-id>
          <pub-id pub-id-type="medline">14552851</pub-id>
          <pub-id pub-id-type="pii">S1532046403000583</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
