<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i4e12575</article-id>
      <article-id pub-id-type="pmid">31682579</article-id>
      <article-id pub-id-type="doi">10.2196/12575</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Extracting Clinical Features From Dictated Ambulatory Consult Notes Using a Commercially Available Natural Language Processing Tool: Pilot, Retrospective, Cross-Sectional Validation Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Parra-Calderón</surname>
            <given-names>Carlos Luis</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Lovis</surname>
            <given-names>Christian</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Yu</surname>
            <given-names>Bei</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Torii</surname>
            <given-names>Manabu</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Ferreira</surname>
            <given-names>Liliana</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zheng</surname>
            <given-names>Shuai</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Petch</surname>
            <given-names>Jeremy</given-names>
          </name>
          <degrees>BA, MA, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Centre for Data Science and Digital Health</institution>
            <institution>Hamilton Health Sciences</institution>
            <addr-line>293 Wellington St North</addr-line>
            <addr-line>Hamilton, ON, L8L 8E7</addr-line>
            <country>Canada</country>
            <phone>1 905 521 2100 ext 47579</phone>
            <email>jeremy.petch@utoronto.ca</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1614-1046</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Batt</surname>
            <given-names>Jane</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7015-189X</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Murray</surname>
            <given-names>Joshua</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9233-4934</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Mamdani</surname>
            <given-names>Muhammad</given-names>
          </name>
          <degrees>PharmD, MA, MPH</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <xref rid="aff8" ref-type="aff">8</xref>
          <xref rid="aff9" ref-type="aff">9</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5199-6344</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Institute of Health Policy, Management and Evaluation</institution>
        <institution>Dalla Lana School of Public Health</institution>
        <institution>University of Toronto</institution>
        <addr-line>Toronto, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Centre for Data Science and Digital Health</institution>
        <institution>Hamilton Health Sciences</institution>
        <addr-line>Hamilton, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Division of Respirology</institution>
        <institution>Department of Medicine</institution>
        <institution>University of Toronto</institution>
        <addr-line>Toronto, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Keenan Research Centre for Biomedical Science</institution>
        <institution>St. Michael's Hospital</institution>
        <addr-line>Toronto, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Medicine</institution>
        <institution>St. Michael's Hospital</institution>
        <addr-line>Toronto, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Li Ka Shing Centre for Healthcare Analytics Research and Training</institution>
        <institution>St. Michael's Hospital</institution>
        <addr-line>Toronto, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Department of Statistical Sciences</institution>
        <institution>Faculty of Arts and Sciences</institution>
        <institution>University of Toronto</institution>
        <addr-line>Toronto, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff8">
        <label>8</label>
        <institution>Leslie Dan Faculty of Pharmacy</institution>
        <institution>University of Toronto</institution>
        <addr-line>Toronto, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff9">
        <label>9</label>
        <institution>Department of Medicine</institution>
        <institution>Faculty of Medicine</institution>
        <institution>University of Toronto</institution>
        <addr-line>Toronto, ON</addr-line>
        <country>Canada</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Jeremy Petch <email>jeremy.petch@utoronto.ca</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <season>Oct-Dec</season>
        <year>2019</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>1</day>
        <month>11</month>
        <year>2019</year>
      </pub-date>
      <volume>7</volume>
      <issue>4</issue>
      <elocation-id>e12575</elocation-id>
      <history>
        <date date-type="received">
          <day>22</day>
          <month>10</month>
          <year>2018</year>
        </date>
        <date date-type="rev-request">
          <day>26</day>
          <month>1</month>
          <year>2019</year>
        </date>
        <date date-type="rev-recd">
          <day>12</day>
          <month>5</month>
          <year>2019</year>
        </date>
        <date date-type="accepted">
          <day>29</day>
          <month>8</month>
          <year>2019</year>
        </date>
      </history>
      <copyright-statement>©Jeremy Petch, Jane Batt, Joshua Murray, Muhammad Mamdani. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 01.11.2019.</copyright-statement>
      <copyright-year>2019</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://medinform.jmir.org/2019/4/e12575/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The increasing adoption of electronic health records (EHRs) in clinical practice holds the promise of improving care and advancing research by serving as a rich source of data, but most EHRs allow clinicians to enter data in a text format without much structure. Natural language processing (NLP) may reduce reliance on manual abstraction of these text data by extracting clinical features directly from unstructured clinical digital text data and converting them into structured data.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to assess the performance of a commercially available NLP tool for extracting clinical features from free-text consult notes.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We conducted a pilot, retrospective, cross-sectional study of the accuracy of NLP from dictated consult notes from our tuberculosis clinic with manual chart abstraction as the reference standard. Consult notes for 130 patients were extracted and processed using NLP. We extracted 15 clinical features from these consult notes and grouped them a priori into categories of simple, moderate, and complex for analysis.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>For the primary outcome of overall accuracy, NLP performed best for features classified as simple, achieving an overall accuracy of 96% (95% CI 94.3-97.6). Performance was slightly lower for features of moderate clinical and linguistic complexity at 93% (95% CI 91.1-94.4), and lowest for complex features at 91% (95% CI 87.3-93.1).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The findings of this study support the use of NLP for extracting clinical features from dictated consult notes in the setting of a tuberculosis clinic. Further research is needed to fully establish the validity of NLP for this and other purposes.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>natural language processing</kwd>
        <kwd>electronic health record</kwd>
        <kwd>tuberculosis</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>In recent years, the use of electronic health records (EHRs) in office-based clinical practices in the United States has more than doubled, from approximately 40% in 2008 to nearly 90% in 2015 [<xref ref-type="bibr" rid="ref1">1</xref>]. This rise has been even sharper in hospitals, where EHR adoption has increased from about 10% in 2008 to nearly 85% in 2015 [<xref ref-type="bibr" rid="ref2">2</xref>]. The increasing adoption of EHRs in clinical practice holds the promise of improving care and advancing research by serving as a rich source of data. However, gleaning useful information from EHR data can be challenging, and the use of such data for research purposes varies considerably across jurisdictions [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
        <p>One challenge relates to EHRs allowing clinicians to enter data in text format without much structure. Although this enhances clinical usability, it often requires costly and time-consuming manual chart abstraction processes to extract useful information in a structured manner. These challenges have sparked an increasing interest in the potential for natural language processing (NLP) approaches to process unstructured clinical digital text data, extract clinical features, and convert them into structured data.</p>
        <p>Although NLP approaches for processing radiological reports are now well established [<xref ref-type="bibr" rid="ref4">4</xref>], the practice of using NLP for processing more general clinical documentation, especially consult notes, is still developing. Research to date has explored several applications of NLP to general clinical documentation, including identification of breast cancer recurrence [<xref ref-type="bibr" rid="ref5">5</xref>], social isolation [<xref ref-type="bibr" rid="ref6">6</xref>], falls risk [<xref ref-type="bibr" rid="ref7">7</xref>], depression [<xref ref-type="bibr" rid="ref8">8</xref>], homelessness [<xref ref-type="bibr" rid="ref9">9</xref>], intraductal papillary mucinous neoplasms [<xref ref-type="bibr" rid="ref10">10</xref>], and new clinically relevant information for organ transplant patients [<xref ref-type="bibr" rid="ref11">11</xref>]. One common feature of much of the research to date is that studies have tended to leverage open-source and academic tools for NLP. Although these tools can be highly effective, most are available as libraries for programming languages such as Python and R, which can pose a barrier for health care organizations that lack robust digital capacity or academic partnerships. However, there are an increasing number of commercially available NLP tools, such as Linguamatics I2E and Google Cloud’s AutoML, that promise to make NLP significantly more accessible for general users, but to date, there have been relatively few studies that have evaluated the validity of these tools for clinical feature extraction [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref12">12</xref>].</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>We conducted a pilot study to examine the accuracy of a commercially available NLP tool relative to manual chart abstraction in capturing useful information from free-text consult notes in an outpatient tuberculosis (TB) clinic.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Setting</title>
        <p>We conducted a pilot, retrospective, cross-sectional study of feature extraction accuracy using NLP, with manual chart abstraction as the reference standard. The study setting was St. Michael’s Hospital, which is a 450-bed urban academic hospital affiliated with the University of Toronto. The St. Michael’s TB program serves as a tertiary referral center for patients with active TB and latent TB infection, managing patients in both inpatient and outpatient settings. The program is staffed by a rotating roster of 8 physicians (6 respirologists and 2 infectious disease physicians) and 1 TB nurse practitioner and has a volume of approximately 2000 outpatient encounters annually. This study was approved by the St. Michael’s Hospital Research Ethics Board and conducted in accordance with its policies.</p>
      </sec>
      <sec>
        <title>Natural Language Processing Approach</title>
        <p>We conducted our NLP analysis using a commercial NLP engine (Pentavere’s DARWEN), which integrates 3 primary approaches to extract clinical features: (1) manually prepared natural language extraction rules that describe the general syntax and lexicon of each feature (both custom and internationally recognized ontologies such as Medical Subject Headings and Systematized Nomenclature of Medicine-Clinical Terms are utilized as an initial source of synonyms for common clinical terms), (2) machine-learned inferred rules that are designed to complement and reduce the extraction error rate of the manually prepared rules (the usage of machine learning in DARWEN is directed to improve the quality of the clinical natural language extraction rather than to predict or infer clinical features based on other features, as is the case with many competing systems), and (3) heuristic rules that encapsulate overarching clinical knowledge that must be respected when considering the clinical features holistically. This workflow is illustrated in <xref rid="figure1" ref-type="fig">Figure 1</xref>.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Natural language processing (NLP) workflow using the DARWEN tool. PRP: pronoun; VB: verb; RB: adverb; JJ: adjective; CC: coordinating conjunction; DT: determiner; NN: noun; IN: preposition; TB: tuberculosis; TST: Tuberculin Skin Test.</p>
          </caption>
          <graphic xlink:href="medinform_v7i4e12575_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>We followed the standard process for employing DARWEN, which involves tuning, testing, and retuning against a reference standard, together with clinician consultation to resolve any semantic issues as well as to develop the heuristic rules. Tuning refers to the process of refining NLP extraction rules based on manual analysis of text and is an essential step to successfully account for the variability in terminology and documentation structure between clinicians. Generating rules during the tuning process is an iterative, feature-by-feature, semisupervised process. First, we focused on recognizing the key entities associated with any feature, such as comorbidities. Given the low volume of data in the training set, we started with recurrent neural network-based named entity recognition (NER) models, which were pretrained for recognizing drugs, diagnosis, medical risk factors, and adverse drug reactions on Pentavere’s proprietary clinical dataset (Pentavere’s proprietary corpus includes over 100,000 patients, with an average of 50 clinical notes per patient); discussed the match results with the clinician; and supplemented the NER model with heuristics to accommodate any discrepancies. For clinical features not appropriate for NER models, we employed a purely heuristic approach. For example, for a feature such as smoking status, we developed an initial set of rules to cover 3 straightforward cases: explicit mention of nonsmoker (eg, “She never smokes”), explicit mention of former smoker (eg, “she is a former light smoker”), and qualified mention of former smoker (eg, “She is a smoker who gave up 2 years ago”). 
Although these captured many cases of smoking found in the text, the tuning process revealed many more subtle cases that required further development of rules, such as a smoker who quit and then started again, handling of indeterminate language (eg, “She has a 20 pack year smoking history” in which it is not clear whether the patient still smokes or has quit), oblique mentions (eg, “She uses marijuana”), and second-hand smoker (eg, “Her former roommate was a smoker, but she was not”). In this case, we developed rules to label token sequences (spans) into each of the different cases of smoker, former smoker, and nonsmoker. These rules are a combination of syntactic and lexical patterns, sometimes manually specified and sometimes induced from the data itself.</p>
        <p>We then turned our attention to modeling the relationships between entities using a constituent parse tree kernel–based induction semisupervised machine learning technique, Pentavere’s proprietary algorithm inspired by the Dual Iterative Pattern Relation Expansion algorithm [<xref ref-type="bibr" rid="ref13">13</xref>]. For training data, the algorithm uses a few starting phrases or sentences that provide a valid relationship and a few that provide an invalid relationship. Given some initial examples of related entities, the algorithm finds generalizations of parse trees that define those known relationships. These syntactic rules/patterns were then applied to find other entities that appear to be in similar relationships. We also leveraged features of the tool that support several contextual states, including polarity (negation), certainty/uncertainty, hypothesis (if… then…), historical context (history of…), and experiencer (patient and family member). This contextualization uses constituent and dependency parse trees to describe different types of relationships between tokens in text and thus determine the scope of the context, for example, to restrict a context to only apply to entities contained in specific sub (constituent) trees of the context and/or require a specific dependency relationship between the entities in context. For a case such as, “She has no apparent rash causing her pruritus,” this approach recognizes that rash is negated but pruritus is not negated.</p>
      </sec>
      <sec>
        <title>Sampling Approach</title>
        <p>To create our corpus, we randomly sampled 130 patient records from a total pool of 351 records from our hospital’s outpatient TB clinic without exclusion and extracted their consult notes from their EHR. Consult notes for all outpatient encounters in the TB clinic are dictated by the attending physician or resident, followed by review and electronic sign-off by the attending physician. Dictations are free format, with no standardized template. They contain detailed clinical information about patients’ demographics, diagnosis, treatment course (including medications), and progress. Given that these notes contain personal health information, we are not able to share the corpus, but we have included synthetic samples of both assessment and follow-up notes in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, which are representative of the corpus.</p>
        <p>We randomly divided our sample into 3 parts to support the tuning process described above, a tuning sample (n=30), a first-round testing/retuning sample (n=50), and a final testing sample (n=50). A single patient record allotted to the final testing sample contained corrupted data, reducing the final testing sample size to 49.</p>
      </sec>
      <sec>
        <title>Feature Identification</title>
        <p>The following features were selected for extraction: country of birth, date of immigration to Canada, HIV status, known TB exposure, previous TB, smoking status, diagnosis, method of diagnosis, TB sensitivities, sputum culture conversion date, drug treatments, adverse drug reactions, medical risk factors for TB acquisition, social risk factors for TB acquisition, and disease extent (<xref ref-type="table" rid="table1">Table 1</xref>).</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Feature categorization based on a priori assessment of clinical and linguistic complexity.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="370"/>
            <col width="200"/>
            <col width="400"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Feature complexity and feature</td>
                <td>Type</td>
                <td>Examples</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>Simple</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Country of birth</td>
                <td>Country</td>
                <td>India; Indonesia</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Date of immigration</td>
                <td>Date</td>
                <td>30/06/2013</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Smoking status</td>
                <td>Categorical</td>
                <td>Current smoker; former smoker</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Drug treatment</td>
                <td>Text mapped to drug list</td>
                <td>Isoniazid; rifampin</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Moderate</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>HIV status</td>
                <td>Binary</td>
                <td>Positive/negative</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Known TB<sup>a</sup> exposure</td>
                <td>Binary</td>
                <td>Yes/no</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Previous TB</td>
                <td>Binary</td>
                <td>Yes/no</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Method of diagnosis</td>
                <td>Categorical</td>
                <td>Culture positive; polymerase chain reaction positive</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>TB sensitivities</td>
                <td>Categorical</td>
                <td>Fully sensitive; isoniazid resistant</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Complex</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Diagnosis</td>
                <td>Categorical</td>
                <td>Active TB; latent TB infection</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Sputum culture conversion date</td>
                <td>Date</td>
                <td>22/07/2016</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Adverse drug reactions</td>
                <td>Categorical</td>
                <td>Peripheral neuropathy; rash</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Medical risk factors</td>
                <td>Categorical</td>
                <td>Chemotherapy; renal failure</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Social risk factors</td>
                <td>Categorical</td>
                <td>Refugee camp resident; jail inmate</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Disease extent</td>
                <td>Categorical</td>
                <td>Pulmonary acid fast bacilli smear positive; disseminated</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>TB: tuberculosis.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>For each feature where a patient could have multiple observations, a series of dichotomous indicator features were created. For example, for drug treatment, patients could be on multiple medications, so dichotomous features were created for each relevant medication.</p>
        <p>For analysis, we pooled these features into 3 categories—simple, moderate, and complex—based on an a priori assessment by a clinical expert of the relative clinical and linguistic complexity of each feature, based upon their clinical judgment (<xref ref-type="table" rid="table1">Table 1</xref>). Complex features were typically those where NLP would have to go well beyond simply categorizing terms based on a reference dictionary but would instead have to successfully process rich language with significant clinical context. For example, adverse drug reactions are particularly challenging as we may see the mention of a <italic>rash</italic> in the text, but this does not determine whether there was in fact a rash or whether a rash was the result of an adverse drug reaction. To determine whether there was a rash, we have to be able to rule out cases with the physician dictating “no evidence of rash,” patient complaining of rash but not diagnosed as such by the physician, and the physician dictating that she discussed rashes as possible side effects of the medication. Once it has been determined that a rash is present, we must first determine whether a rash is in fact a possible side effect of a drug the patient had been prescribed and then identify if the rash started when the drug was administered, which unless explicitly dictated, requires the solution to process the patient encounters longitudinally.</p>
        <p>The reference standard was created by a trained chart reviewer, who manually extracted features from patient records using a standardized data extraction form; this served as the <italic>reference standard analysis</italic>. One of the coauthors (JB) trained both the chart reviewer and the NLP engineer on how to perform chart abstraction to ensure the same clinical criteria would be used by both. This coauthor (JB) performed arbitration in cases of disagreement between the chart abstractor and the NLP tool’s output. Arbitrated results were used to retune the model on the training dataset before the final testing phase.</p>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <p>The primary outcome of our study was overall accuracy, defined as the number of correctly classified observations divided by the total number of observations [<xref ref-type="bibr" rid="ref14">14</xref>]. Secondary outcomes were sensitivity (recall), specificity, positive predictive value (PPV; precision), and negative predictive value (NPV) [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. NLP-abstracted data were treated as the <italic>index analysis</italic>, with manual chart review acting as the <italic>reference standard analysis</italic>.</p>
        <p>Analysis was divided into 2 stages. The first stage was conducted after a single round of tuning of the NLP algorithms (n=50). The results of this stage were used to retune the semantic and heuristic rules used by the NLP tool to improve accuracy. The final analysis stage was conducted on the remaining records (n=49).</p>
        <p>For the primary outcome, within each feature category, we calculated the accuracy and a 95% CI using standard methods for continuous features and proportions [<xref ref-type="bibr" rid="ref17">17</xref>]. For secondary outcomes, we calculated the average and standard deviation within each category. For example, for the simple category, we calculated secondary outcomes for each feature within the category, averaged them, and calculated the standard deviation. This is a way of illustrating the average sensitivity, specificity, PPV and NPV, and spread across all classes of a multicategorical feature. All analyses were conducted using R (v 3.3.0).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overview</title>
        <p>The study sample of 129 subjects included 71 females (55.0%, 71/129) with a mean age of 36.51 years and 58 males (45.0%, 58/129) with a mean age of 46.74 years. Consult notes from 9 clinicians (8 physicians and 1 nurse practitioner) were included in the sample. A total of 138 points of discrepancy between the NLP process and the reference standard chart abstraction were identified.</p>
      </sec>
      <sec>
        <title>Natural Language Processing Performance</title>
        <p>For the primary outcome (<xref ref-type="table" rid="table2">Table 2</xref>), NLP performed best for features classified as simple, achieving an overall accuracy of 96% (95% CI 94.3-97.6). Performance was slightly lower for features of moderate clinical and linguistic complexity at 93% (95% CI 91.1-94.4) and lowest for complex features at 91% (95% CI 87.3-93.1).</p>
        <p>For secondary outcomes (<xref ref-type="table" rid="table2">Table 2</xref>), NLP achieved a sensitivity of 94% (SD 7.7) for simple, 60% (SD 38.6) for moderate, and 74% (SD 45.7) for complex features and PPV of 96% (SD 6.4) for simple, 70% (SD 33.7) for moderate, and 54% (SD 37.4) for complex features. The relatively low sensitivity and PPV for moderate and complex features are in contrast to NLP’s specificity of 99% (SD 0.5) for simple, 94% (SD 5.0) for moderate, and 89% (SD 8.3) for complex features and NPV of 99% (SD 1.7) for simple, 96% (SD 6.6) for moderate, and 98% (SD 2.9) for complex features.</p>
        <p>Unsurprisingly, we saw considerable variation in NLP’s performance at the clinical feature level (<xref ref-type="table" rid="table3">Table 3</xref>). NLP performed extremely well for detecting drug prescriptions, achieving 100% for all primary and secondary outcomes for moxifloxacin, rifampin, ethambutol, and isoniazid. In contrast, NLP did not perform well at the feature level when measuring disease extent, with a sensitivity of only 25% for pulmonary acid fast bacilli (AFB) positive and 0% for extrapulmonary cases because of a very low number of these cases in our sample (4 pulmonary AFB-positive cases and 2 extrapulmonary cases).</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Primary and secondary outcomes for natural language processing (index analysis) compared with manual chart review (reference standard analysis).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="190"/>
            <col width="170"/>
            <col width="170"/>
            <col width="150"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td>Feature complexity</td>
                <td>Primary outcome, overall accuracy (95% CI)</td>
                <td colspan="4">Secondary outcomes</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Sensitivity/recall (SD)</td>
                <td>Specificity (SD)</td>
                <td>Positive predictive value/precision (SD)</td>
                <td>Negative predictive value (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Simple</td>
                <td>96.3 (94.3-97.6)</td>
                <td>93.8 (7.7)</td>
                <td>99.7 (0.5)</td>
                <td>96.4 (6.4)</td>
                <td>99.0 (1.7)</td>
              </tr>
              <tr valign="top">
                <td>Moderate</td>
                <td>92.9 (91.1-94.4)</td>
                <td>60.2 (38.6)</td>
                <td>94.2 (5.0)</td>
                <td>70.2 (33.7)</td>
                <td>95.6 (6.6)</td>
              </tr>
              <tr valign="top">
                <td>Complex</td>
                <td>90.6 (87.3-93.1)</td>
                <td>73.8 (45.7)</td>
                <td>89.2 (8.3)</td>
                <td>53.6 (37.4)</td>
                <td>98.4 (2.9)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Primary and secondary outcomes for natural language processing (index analysis) compared with manual chart review (reference standard analysis) at the clinical feature level.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="30"/>
            <col width="170"/>
            <col width="180"/>
            <col width="160"/>
            <col width="130"/>
            <col width="150"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Feature</td>
                <td>Primary outcome, overall accuracy (95% CI)</td>
                <td colspan="4">Secondary outcomes<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Sensitivity/recall (SD)</td>
                <td>Specificity (SD)</td>
                <td>Positive predictive value/precision (SD)</td>
                <td>Negative predictive value (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="8">
                  <bold>Simple features</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Country of birth</td>
                <td>0.92 (0.80-0.98)</td>
                <td>0.88 (0.32)</td>
                <td>0.99 (0.01)</td>
                <td>0.97 (0.11)</td>
                <td>0.99 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Year of immigration</td>
                <td>0.90 (0.78-0.97)</td>
                <td>0.89 (0.29)</td>
                <td>0.99 (0.02)</td>
                <td>0.98 (0.08)</td>
                <td>0.99 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Smoking status</td>
                <td>0.94 (0.83-0.99)</td>
                <td>0.92 (0.08)</td>
                <td>0.98 (0.03)</td>
                <td>0.85 (0.30)</td>
                <td>0.97 (0.02)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Sputum conversion date</td>
                <td>0.98 (0.89-0.99)</td>
                <td>0.80 (0.45)</td>
                <td>0.99 (0.01)</td>
                <td>0.99 (0.01)</td>
                <td>0.99 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Pyrazinamide</td>
                <td>0.96 (0.86-0.99)</td>
                <td>1.00</td>
                <td>0.85</td>
                <td>0.95</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Moxifloxacin</td>
                <td>1.00 (0.93-1.00)</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Vitamin B6</td>
                <td>0.92 (0.80-0.98)</td>
                <td>1.00</td>
                <td>0.86</td>
                <td>0.84</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Rifampin</td>
                <td>1.00 (0.93-1.00)</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Ethambutol</td>
                <td>1.00 (0.93-1.00)</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Isoniazid</td>
                <td>1.00 (0.93-1.00)</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Levofloxacin</td>
                <td>0.98 (0.89-0.99)</td>
                <td>N/A<sup>b</sup></td>
                <td>0.98</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Moderate features</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">HIV status</td>
                <td>0.94 (0.83-0.99)</td>
                <td>0.94</td>
                <td>0.94</td>
                <td>0.89</td>
                <td>0.97</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">TB<sup>c</sup> contact</td>
                <td>0.82 (0.68-0.91)</td>
                <td>0.80</td>
                <td>0.82</td>
                <td>0.67</td>
                <td>0.90</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Old TB</td>
                <td>0.94 (0.83-0.99)</td>
                <td>0.71</td>
                <td>0.98</td>
                <td>0.83</td>
                <td>0.95</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Culture positive</td>
                <td>0.88 (0.75-0.95)</td>
                <td>0.33</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>0.87</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Polymerase chain reaction positive</td>
                <td>1.00 (0.93-1.00)</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Clinical diagnosis</td>
                <td>1.00 (0.93-1.00)</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Drug sensitivity</td>
                <td>0.92 (0.80-0.98)</td>
                <td>0.81 (0.27)</td>
                <td>0.97 (0.04)</td>
                <td>0.73 (0.25)</td>
                <td>0.91 (0.14)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Corticosteroids</td>
                <td>0.98 (0.89-0.99)</td>
                <td>N/A</td>
                <td>0.98</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Chemotherapy</td>
                <td>0.94 (0.83-0.99)</td>
                <td>0.50</td>
                <td>0.96</td>
                <td>0.33</td>
                <td>0.98</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Other immunosuppressive drugs</td>
                <td>0.76 (0.61-0.87)</td>
                <td>0.08</td>
                <td>0.97</td>
                <td>0.50</td>
                <td>0.77</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Cancer</td>
                <td>0.92 (0.80-0.98)</td>
                <td>1.00</td>
                <td>0.91</td>
                <td>0.33</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Diabetes</td>
                <td>0.98 (0.89-0.99)</td>
                <td>0.86</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>0.98</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Malnutrition</td>
                <td>0.94 (0.83-0.99)</td>
                <td>0.00</td>
                <td>0.98</td>
                <td>0.00</td>
                <td>0.96</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Other immunosuppressive conditions</td>
                <td>0.82 (0.68-0.91)</td>
                <td>0.10</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>0.81</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Marginalized</td>
                <td>0.96 (0.86-0.99)</td>
                <td>0.66 (0.57)</td>
                <td>0.93 (0.12)</td>
                <td>0.99 (0.02)</td>
                <td>0.91 (0.14)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Health care facility</td>
                <td>0.90 (0.78-0.97)</td>
                <td>0.38 (0.48)</td>
                <td>0.95 (0.08)</td>
                <td>0.95 (0.08)</td>
                <td>0.97 (0.03)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">
                  <bold>Pulmonary acid fast bacilli</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Positive</td>
                <td>0.92 (0.80-0.98)</td>
                <td>0.25</td>
                <td>0.98</td>
                <td>0.50</td>
                <td>0.93</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Negative</td>
                <td>0.96 (0.86-0.99)</td>
                <td>1.00</td>
                <td>0.96</td>
                <td>0.67</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Extrapulmonary (other than lymphadenitis)</td>
                <td>0.88 (0.75-0.96)</td>
                <td>0.00</td>
                <td>0.96</td>
                <td>0.00</td>
                <td>0.91</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Lymphadenitis</td>
                <td>0.94 (0.83-0.99)</td>
                <td>N/A</td>
                <td>0.94</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Disseminated</td>
                <td>0.96 (0.86-0.99)</td>
                <td>0.00</td>
                <td>1.00</td>
                <td>N/A</td>
                <td>0.96</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Complex features</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Active TB disease</td>
                <td>1.00 (0.93-1.00)</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Latent TB infection</td>
                <td>0.84 (0.70-0.93)</td>
                <td>0.90</td>
                <td>0.79</td>
                <td>0.76</td>
                <td>0.92</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Pulmonary nontuberculous mycobacteria</td>
                <td>0.88 (0.75-0.95)</td>
                <td>1.00</td>
                <td>0.87</td>
                <td>0.25</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">
                  <bold>Adverse drug reaction</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Gastrointestinal</td>
                <td>0.84 (0.70-0.93)</td>
                <td>1.00</td>
                <td>0.76</td>
                <td>0.65</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Peripheral neuropathy</td>
                <td>0.96 (0.86-0.99)</td>
                <td>1.00</td>
                <td>0.95</td>
                <td>0.78</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Rash</td>
                <td>0.90 (0.78-0.97)</td>
                <td>1.00</td>
                <td>0.89</td>
                <td>0.50</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Other</td>
                <td>0.94 (0.83-0.99)</td>
                <td>0.00</td>
                <td>0.98</td>
                <td>0.00</td>
                <td>0.96</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Ocular toxicity</td>
                <td>0.90 (0.75-0.97)</td>
                <td>0.00</td>
                <td>0.92</td>
                <td>0.00</td>
                <td>0.98</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Values within parentheses are standard deviations.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>TB: tuberculosis.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Natural Language Processing Performance Adjusted for Adjudication</title>
        <p>To understand whether NLP’s relatively low sensitivity and PPV for moderate and complex features might be driven by errors in the manual chart review, rather than errors in NLP, we conducted a post hoc analysis in which all 138 points of discrepancy between the reference standard and index analysis were arbitrated by a clinical expert. The expert found the results to be in favor of NLP in 51.4% (71/138) of cases and chart review in 45.7% (63/138) of cases and found that both were incorrect in 2.9% (4/138) of cases.</p>
        <p>After adjusting for the results of adjudication, results for our primary outcome of overall accuracy increased modestly to 98% (95% CI 96.1-98.7) for simple, 96% (95% CI 94.8-97.3) for moderate, and 94% (95% CI 91.3-96.1) for complex features. The sensitivity increased to 78% (SD 25.0) for moderate and 86% (SD 35.0) for complex features, and PPV increased to 93% (SD 14.7) for moderate and 70% (SD 34.2) for complex features (<xref ref-type="table" rid="table4">Table 4</xref>).</p>
        <p>At the feature level (<xref ref-type="table" rid="table5">Table 5</xref>), adjustment for adjudication resulted in several dramatic improvements, particularly in the area of immunosuppressive drugs and conditions. For example, PPV for both cancer and chemotherapy was only 33% before adjudication but increased to 100% following adjudication. Similarly, for other immunosuppressive drugs, sensitivity was only 8% and PPV was only 50% initially, but it increased to 67% and 100%, respectively, after adjudication.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Primary and secondary outcomes for natural language processing compared with manual chart review, adjusted for results of adjudication.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="190"/>
            <col width="170"/>
            <col width="170"/>
            <col width="150"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td>Feature complexity</td>
                <td>Primary outcome, overall accuracy (95% CI)</td>
                <td colspan="4">Secondary outcomes</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Sensitivity/recall (SD)</td>
                <td>Specificity (SD)</td>
                <td>Positive predictive value/precision (SD)</td>
                <td>Negative predictive value (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Simple</td>
                <td>97.8 (96.1-98.7)</td>
                <td>96.4 (5.4)</td>
                <td>99.8 (0.5)</td>
                <td>98.3 (4.5)</td>
                <td>99.2 (1.7)</td>
              </tr>
              <tr valign="top">
                <td>Moderate</td>
                <td>96.2 (94.8-97.3)</td>
                <td>78.2 (25.0)</td>
                <td>93.3 (4.7)</td>
                <td>92.7 (14.7)</td>
                <td>97.2 (3.2)</td>
              </tr>
              <tr valign="top">
                <td>Complex</td>
                <td>94.1 (91.3-96.1)</td>
                <td>86.3 (35.0)</td>
                <td>92.8 (8.2)</td>
                <td>70.5 (34.2)</td>
                <td>98.7 (2.9)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Primary and secondary outcomes for natural language processing compared with manual chart review, adjusted for results of adjudication at the clinical feature level.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="30"/>
            <col width="170"/>
            <col width="0"/>
            <col width="180"/>
            <col width="0"/>
            <col width="160"/>
            <col width="0"/>
            <col width="130"/>
            <col width="0"/>
            <col width="150"/>
            <col width="0"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Feature</td>
                <td colspan="2">Primary outcome, overall accuracy (95% CI)</td>
                <td colspan="8">Secondary outcomes<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">Sensitivity/recall (SD)</td>
                <td colspan="2">Specificity (SD)</td>
                <td colspan="2">Positive predictive value/precision (SD)</td>
                <td colspan="2">Negative predictive value (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="13">
                  <bold>Simple features</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Country of birth</td>
                <td colspan="2">0.94 (0.83-0.99)</td>
                <td colspan="2">0.91 (0.28)</td>
                <td colspan="2">0.99 (0.01)</td>
                <td colspan="2">0.98 (0.10)</td>
                <td>0.99 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Year of immigration</td>
                <td colspan="2">0.92 (0.80-0.98)</td>
                <td colspan="2">0.92 (0.23)</td>
                <td colspan="2">0.99 (0.02)</td>
                <td colspan="2">0.99 (0.06)</td>
                <td>0.99 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Smoking status</td>
                <td colspan="2">0.94 (0.83-0.99)</td>
                <td colspan="2">0.92 (0.08)</td>
                <td colspan="2">0.98 (0.03)</td>
                <td colspan="2">0.85 (0.30)</td>
                <td>0.97 (0.02)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Sputum year</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Pyrazinamide</td>
                <td colspan="2">0.96 (0.86-0.99)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">0.85</td>
                <td colspan="2">0.95</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Moxifloxacin</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Vitamin B6</td>
                <td colspan="2">0.92 (0.80-0.98)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">0.86</td>
                <td colspan="2">0.84</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Rifampin</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Ethambutol</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Isoniazid</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Levofloxacin</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td colspan="13">
                  <bold>Moderate features</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">HIV status</td>
                <td colspan="2">0.98 (0.89-0.99)</td>
                <td colspan="2">0.95</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>0.97</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">TB<sup>b</sup> contact</td>
                <td colspan="2">0.86 (0.73-0.94)</td>
                <td colspan="2">0.92</td>
                <td colspan="2">0.83</td>
                <td colspan="2">0.67</td>
                <td>0.97</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Old TB</td>
                <td colspan="2">0.96 (0.86-0.99)</td>
                <td colspan="2">0.75</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>0.95</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Culture positive</td>
                <td colspan="2">0.88 (0.75-0.95)</td>
                <td colspan="2">0.33</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>0.87</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Polymerase chain reaction positive</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Clinical diagnosis</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Drug sensitivity</td>
                <td colspan="2">0.96 (0.86-0.99)</td>
                <td colspan="2">0.98 (0.03)</td>
                <td colspan="2">0.99 (0.01)</td>
                <td colspan="2">0.80 (0.26)</td>
                <td>0.94 (0.10)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Corticosteroids</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Chemotherapy</td>
                <td colspan="2">0.98 (0.89-0.99)</td>
                <td colspan="2">0.75</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>0.98</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Other immunosuppressive drugs</td>
                <td colspan="2">0.98 (0.89-0.99)</td>
                <td colspan="2">0.67</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>0.98</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Cancer</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Diabetes</td>
                <td colspan="2">0.98 (0.89-0.99)</td>
                <td colspan="2">0.86</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>0.98</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Malnutrition</td>
                <td colspan="2">0.94 (0.83-0.99)</td>
                <td colspan="2">0.00</td>
                <td colspan="2">0.98</td>
                <td colspan="2">0.00</td>
                <td>0.96</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Other immunosuppressive conditions</td>
                <td colspan="2">0.98 (0.89-0.99)</td>
                <td colspan="2">0.50</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>0.98</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Marginalized</td>
                <td colspan="2">0.98 (0.89-0.99)</td>
                <td colspan="2">0.75 (0.50)</td>
                <td colspan="2">0.95 (0.10)</td>
                <td colspan="2">0.99 (0.01)</td>
                <td>0.99 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Health care facility</td>
                <td colspan="2">0.92 (0.80-0.97)</td>
                <td colspan="2">0.50 (0.50)</td>
                <td colspan="2">0.86 (0.29)</td>
                <td colspan="2">0.95 (0.06)</td>
                <td>0.97 (0.03)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="5">
                  <bold>Pulmonary acid fast bacillus</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Positive</td>
                <td colspan="2">0.92 (0.80-0.98)</td>
                <td colspan="2">0.25</td>
                <td colspan="2">0.98</td>
                <td colspan="2">0.50</td>
                <td>0.93</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Negative</td>
                <td colspan="2">0.96 (0.86-0.99)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">0.95</td>
                <td colspan="2">0.67</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Extrapulmonary (other than lymphadenitis)</td>
                <td colspan="2">0.96 (0.86-0.99)</td>
                <td colspan="2">0.50</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>0.95</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Lymphadenitis</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Disseminated</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">N/A<sup>c</sup></td>
                <td colspan="2">1.00</td>
                <td colspan="2">N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td colspan="13">
                  <bold>Complex features</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Active TB disease</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Latent TB infection</td>
                <td colspan="2">0.84 (0.70-0.93)</td>
                <td colspan="2">0.90</td>
                <td colspan="2">0.79</td>
                <td colspan="2">0.76</td>
                <td>0.92</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Pulmonary nontuberculous mycobacteria</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">
                  <bold>Adverse drug reaction</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Gastrointestinal</td>
                <td colspan="2">0.90 (0.78-0.97)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">0.84</td>
                <td colspan="2">0.78</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Peripheral neuropathy</td>
                <td colspan="2">1.00 (0.93-1.00)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td colspan="2">1.00</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Rash</td>
                <td colspan="2">0.90 (0.78-0.97)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">0.89</td>
                <td colspan="2">0.50</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Other</td>
                <td colspan="2">0.97 (0.89-0.99)</td>
                <td colspan="2">1.00</td>
                <td colspan="2">0.98</td>
                <td colspan="2">0.50</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Ocular toxicity</td>
                <td colspan="2">0.90 (0.75-0.97)</td>
                <td colspan="2">0.00</td>
                <td colspan="2">0.92</td>
                <td colspan="2">0.00</td>
                <td>0.98</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>Values within parentheses are standard deviations.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>TB: tuberculosis.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The findings of this study suggest that a commercially available NLP tool can perform very well when compared with the reference standard of manual chart review in extracting useful clinical information from digital text notes in our TB clinic with limited training. This was especially true in the case of straightforward findings, such as prescribed medications, smoking status, country of birth, year of immigration, and sputum conversion date. Unsurprisingly, accuracy decreased slightly as clinical features became more complex, but it remained over 90% for complex features.</p>
        <p>One notable finding is that although NLP performed extremely well with respect to specificity and NPV for moderate and complex findings, sensitivity and PPV were considerably lower. These results are in keeping with other studies using free-format clinical notes for complex feature extraction, such as the study by Perlis et al, who reported a sensitivity of 42% and PPV of 78% for the detection of depression [<xref ref-type="bibr" rid="ref8">8</xref>]. However, these findings are in contrast to the high sensitivity and PPV reported in studies looking at radiology reports, such as the study by Al-Haddad et al, who demonstrated a sensitivity of 97% and PPV of 95% in the detection of intraductal papillary mucinous neoplasms [<xref ref-type="bibr" rid="ref10">10</xref>]. This discrepancy may be either because of differences in complexity of features or because of differences inherent between radiology reports, which are relatively structured, often with minimal variability from practitioner to practitioner, versus free-format clinical notes, which have less structure and greater variability across practitioners.</p>
        <p>In terms of ease of use of a commercially available tool, deploying Pentavere’s DARWEN in our environment was a straightforward installation of their application on a desktop computer. The iterative tuning and relationship modeling for all clinical features took our NLP engineer roughly 4 weeks to complete. The tuning required roughly 6 hours of clinician time to provide clinical context for the NLP engineer, confirm clinical validity of heuristic rules, and perform arbitration of discrepancies between chart review and NLP.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>Our study is novel in several ways. First, to our knowledge, this is only the third study to explore the validity of NLP for the identification of TB patients and the first to examine dictated consult notes versus radiological reports and structured laboratory results for this purpose [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. Second, research on NLP applications in medicine tends to focus on only a single clinical condition such as the presence of a tumor [<xref ref-type="bibr" rid="ref10">10</xref>], a diagnosis such as depression [<xref ref-type="bibr" rid="ref8">8</xref>], or a social condition such as homelessness [<xref ref-type="bibr" rid="ref9">9</xref>]. In contrast, our study is substantially broader compared with other more commonly published studies, looking at 15 distinct medical and social features. Finally, our study is one of the few to evaluate the performance of a commercially available NLP tool [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref12">12</xref>].</p>
        <p>Our study has several limitations. First, review of the feature-level analysis reveals that some dichotomous features had very low incidence, making sensitivity and PPV very sensitive to error. Second, our choice to randomly sample for our initial training dataset (n=30) resulted in an undersampling of cases of ocular toxicity due to an adverse drug reaction. As a result, the NLP tool was never trained on this feature and subsequently performed poorly for this feature on the final testing set, potentially underestimating the effectiveness of a properly trained tool. This suggests that a real-world application of this technology may require a more purposive sampling strategy than our random sampling approach. Third, our study employed only a single chart abstractor and a single adjudicator. Finally, this study was conducted at a single center, in a focused clinical area, and with a relatively small final test sample (n=49), which may limit the generalizability of our findings. However, the goal of this pilot study was to establish the feasibility of using NLP to extract clinical features from dictated consult notes and to inform the approach to larger future studies.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>NLP technology has been advancing quickly in recent years, and the potential clinical applications are numerous. The findings of this study support the application of extracting clinical features from dictated consult notes in the setting of a TB clinic. Further research is needed to fully establish the validity of NLP for this and other purposes. However, its application to free-format consult notes may be of particular benefit, as it offers a course whereby clinicians can document in their preferred method of narrative free text, with data still available for applications such as research and program quality control initiatives, without the cost and effort of manual chart review.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Corpus sample (synthetic consult notes).</p>
        <media xlink:href="medinform_v7i4e12575_app1.pdf" xlink:title="PDF File  (Adobe PDF File), 219 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AFB</term>
          <def>
            <p>acid fast bacilli</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">NER</term>
          <def>
            <p>named entity recognition</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NPV</term>
          <def>
            <p>negative predictive value</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">PPV</term>
          <def>
            <p>positive predictive value</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">TB</term>
          <def>
            <p>tuberculosis</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <source>Health IT Dashboard</source>
          <year>2017</year>
          <access-date>2018-08-12</access-date>
          <comment>Office-Based Physician Electronic Health Record Adoption <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dashboard.healthit.gov/quickstats/pages/physician-ehr-adoption-trends.php">https://dashboard.healthit.gov/quickstats/pages/physician-ehr-adoption-trends.php</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Henry</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pylypchuk</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Searcy</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <source>Health IT Dashboard</source>
          <year>2016</year>
          <access-date>2018-08-12</access-date>
          <comment>Adoption of Electronic Health Record Systems among US Non-Federal Acute Care Hospitals: 2008-2015 <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dashboard.healthit.gov/evaluations/data-briefs/non-federal-acute-care-hospital-ehr-adoption-2008-2015.php">https://dashboard.healthit.gov/evaluations/data-briefs/non-federal-acute-care-hospital-ehr-adoption-2008-2015.php</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van Velthoven</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Mastellos</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Majeed</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>O'Donoghue</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Car</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Feasibility of extracting data from electronic medical records for research: an international comparative study</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2016</year>
          <month>07</month>
          <day>13</day>
          <volume>16</volume>
          <fpage>90</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-016-0332-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-016-0332-1</pub-id>
          <pub-id pub-id-type="medline">27411943</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-016-0332-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC4944506</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pons</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Braun</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Hunink</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Kors</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing in radiology: a systematic review</article-title>
          <source>Radiology</source>
          <year>2016</year>
          <month>05</month>
          <volume>279</volume>
          <issue>2</issue>
          <fpage>329</fpage>
          <lpage>43</lpage>
          <pub-id pub-id-type="doi">10.1148/radiol.16142770</pub-id>
          <pub-id pub-id-type="medline">27089187</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Espino</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Roy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Clare</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Neapolitan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Using natural language processing and machine learning to identify breast cancer local recurrence</article-title>
          <source>BMC Bioinformatics</source>
          <year>2018</year>
          <month>12</month>
          <day>28</day>
          <volume>19</volume>
          <issue>Suppl 17</issue>
          <fpage>498</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/s12859-018-2466-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12859-018-2466-x</pub-id>
          <pub-id pub-id-type="medline">30591037</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12859-018-2466-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC6309052</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>VJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lenert</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Bunnell</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Obeid</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Jefferson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Halbert</surname>
              <given-names>CH</given-names>
            </name>
          </person-group>
          <article-title>Automatically identifying social isolation from clinical narratives for patients with prostate cancer</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2019</year>
          <month>03</month>
          <day>14</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>43</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-019-0795-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-019-0795-y</pub-id>
          <pub-id pub-id-type="medline">30871518</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-019-0795-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC6416852</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>VJ</given-names>
            </name>
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>TD</given-names>
            </name>
            <name name-style="western">
              <surname>Warren</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Jenny</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Meystre</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lenert</surname>
              <given-names>LA</given-names>
            </name>
          </person-group>
          <article-title>Identifying falls risk screenings not documented with administrative codes using natural language processing</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>1923</fpage>
          <lpage>30</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854264"/>
          </comment>
          <pub-id pub-id-type="medline">29854264</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977708</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Perlis</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Iosifescu</surname>
              <given-names>DV</given-names>
            </name>
            <name name-style="western">
              <surname>Castro</surname>
              <given-names>VM</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Gainer</surname>
              <given-names>VS</given-names>
            </name>
            <name name-style="western">
              <surname>Minnier</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Goryachev</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Gallagher</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Fava</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Weilburg</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Churchill</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>IS</given-names>
            </name>
            <name name-style="western">
              <surname>Smoller</surname>
              <given-names>JW</given-names>
            </name>
          </person-group>
          <article-title>Using electronic medical records to enable large-scale studies in psychiatry: treatment resistant depression as a model</article-title>
          <source>Psychol Med</source>
          <year>2012</year>
          <month>01</month>
          <volume>42</volume>
          <issue>1</issue>
          <fpage>41</fpage>
          <lpage>50</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21682950"/>
          </comment>
          <pub-id pub-id-type="doi">10.1017/S0033291711000997</pub-id>
          <pub-id pub-id-type="medline">21682950</pub-id>
          <pub-id pub-id-type="pii">S0033291711000997</pub-id>
          <pub-id pub-id-type="pmcid">PMC3837420</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gundlapalli</surname>
              <given-names>AV</given-names>
            </name>
            <name name-style="western">
              <surname>Carter</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Divita</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Palmer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>South</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Durgahee</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Redd</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Samore</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Extracting concepts related to homelessness from the free text of VA electronic medical records</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2014</year>
          <volume>2014</volume>
          <fpage>589</fpage>
          <lpage>98</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25954364"/>
          </comment>
          <pub-id pub-id-type="medline">25954364</pub-id>
          <pub-id pub-id-type="pmcid">PMC4419940</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Al-Haddad</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Friedlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kesterson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Waters</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Aguilar-Saavedra</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing for the development of a clinical registry: a validation study in intraductal papillary mucinous neoplasms</article-title>
          <source>HPB (Oxford)</source>
          <year>2010</year>
          <month>12</month>
          <volume>12</volume>
          <issue>10</issue>
          <fpage>688</fpage>
          <lpage>95</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1365-182X(15)30257-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1477-2574.2010.00235.x</pub-id>
          <pub-id pub-id-type="medline">21083794</pub-id>
          <pub-id pub-id-type="pii">S1365-182X(15)30257-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC3003479</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Pakhomov</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Arsoniadis</surname>
              <given-names>EG</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Melton</surname>
              <given-names>GB</given-names>
            </name>
          </person-group>
          <article-title>Detecting clinically relevant new information in clinical notes across specialties and settings</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2017</year>
          <month>07</month>
          <day>5</day>
          <volume>17</volume>
          <issue>Suppl 2</issue>
          <fpage>68</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-017-0464-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-017-0464-y</pub-id>
          <pub-id pub-id-type="medline">28699564</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-017-0464-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC5506580</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Levine</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Alexander</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Sathiyapalan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Agrawal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pond</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Learning health system for breast cancer: pilot project experience</article-title>
          <source>JCO Clin Cancer Inform</source>
          <year>2019</year>
          <month>08</month>
          <volume>3</volume>
          <fpage>1</fpage>
          <lpage>11</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://ascopubs.org/doi/full/10.1200/CCI.19.00032?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub%3dpubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1200/CCI.19.00032</pub-id>
          <pub-id pub-id-type="medline">31369338</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brin</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Extracting Patterns and Relations from the World Wide Web</article-title>
          <source>Proceedings of the International Workshop on the World Wide Web and Databases</source>
          <year>1998</year>
          <conf-name>WebDB'98</conf-name>
          <conf-date>March 27-28, 1998</conf-date>
          <conf-loc>Valencia, Spain</conf-loc>
          <fpage>172</fpage>
          <lpage>83</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1007/10704656_11"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/10704656_11</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shapiro</surname>
              <given-names>DE</given-names>
            </name>
          </person-group>
          <article-title>The interpretation of diagnostic tests</article-title>
          <source>Stat Methods Med Res</source>
          <year>1999</year>
          <month>06</month>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>113</fpage>
          <lpage>34</lpage>
          <pub-id pub-id-type="doi">10.1177/096228029900800203</pub-id>
          <pub-id pub-id-type="medline">10501649</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Bland</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Diagnostic tests. 1: sensitivity and specificity</article-title>
          <source>Br Med J</source>
          <year>1994</year>
          <month>06</month>
          <day>11</day>
          <volume>308</volume>
          <issue>6943</issue>
          <fpage>1552</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/8019315"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.308.6943.1552</pub-id>
          <pub-id pub-id-type="medline">8019315</pub-id>
          <pub-id pub-id-type="pmcid">PMC2540489</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Bland</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Diagnostic tests 2: predictive values</article-title>
          <source>Br Med J</source>
          <year>1994</year>
          <month>07</month>
          <day>9</day>
          <volume>309</volume>
          <issue>6947</issue>
          <fpage>102</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/8038641"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.309.6947.102</pub-id>
          <pub-id pub-id-type="medline">8038641</pub-id>
          <pub-id pub-id-type="pmcid">PMC2540558</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gardner</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>DG</given-names>
            </name>
          </person-group>
          <article-title>Confidence intervals rather than <italic>P</italic> values: estimation rather than hypothesis testing</article-title>
          <source>Br Med J (Clin Res Ed)</source>
          <year>1986</year>
          <month>03</month>
          <day>15</day>
          <volume>292</volume>
          <issue>6522</issue>
          <fpage>746</fpage>
          <lpage>50</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/3082422"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.292.6522.746</pub-id>
          <pub-id pub-id-type="medline">3082422</pub-id>
          <pub-id pub-id-type="pmcid">PMC1339793</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jain</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Knirsch</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Identification of suspected tuberculosis patients based on natural language processing of chest radiograph reports</article-title>
          <source>Proc AMIA Annu Fall Symp</source>
          <year>1996</year>
          <fpage>542</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/8947725"/>
          </comment>
          <pub-id pub-id-type="medline">8947725</pub-id>
          <pub-id pub-id-type="pmcid">PMC2233236</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Knirsch</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Jain</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Pablos-Mendez</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Automated tuberculosis detection</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>1997</year>
          <volume>4</volume>
          <issue>5</issue>
          <fpage>376</fpage>
          <lpage>81</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/9292843"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/jamia.1997.0040376</pub-id>
          <pub-id pub-id-type="medline">9292843</pub-id>
          <pub-id pub-id-type="pmcid">PMC61255</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
