<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i2e18756</article-id>
      <article-id pub-id-type="pmid">33605893</article-id>
      <article-id pub-id-type="doi">10.2196/18756</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Measuring Adoption of Patient Priorities–Aligned Care Using Natural Language Processing of Electronic Health Records: Development and Validation of the Model</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Shen</surname>
            <given-names>Feichen</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Coquet</surname>
            <given-names>Jean</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Pollettini</surname>
            <given-names>Juliana T</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Rousseau</surname>
            <given-names>Justin</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Razjouyan</surname>
            <given-names>Javad</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>VA Health Services Research and Development Service</institution>
            <institution>Center for Innovations in Quality, Effectiveness and Safety</institution>
            <institution>Michael E DeBakey VA Medical Center</institution>
            <addr-line>2002 Holcombe Blvd</addr-line>
            <addr-line>Houston, TX, 77030</addr-line>
            <country>United States</country>
            <phone>1 5203424525</phone>
            <email>javad.razjouyan@bcm.edu</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1157-159X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Freytag</surname>
            <given-names>Jennifer</given-names>
          </name>
          <degrees>JD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3169-8432</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Dindo</surname>
            <given-names>Lilian</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3277-947X</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Kiefer</surname>
            <given-names>Lea</given-names>
          </name>
          <degrees>MPH</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1374-7835</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Odom</surname>
            <given-names>Edward</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7376-0674</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Halaszynski</surname>
            <given-names>Jaime</given-names>
          </name>
          <degrees>LCSW</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3439-0580</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Silva</surname>
            <given-names>Jennifer W</given-names>
          </name>
          <degrees>LCSW</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9352-609X</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Naik</surname>
            <given-names>Aanand D</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6936-7984</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>VA Health Services Research and Development Service</institution>
        <institution>Center for Innovations in Quality, Effectiveness and Safety</institution>
        <institution>Michael E DeBakey VA Medical Center</institution>
        <addr-line>Houston, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Medicine</institution>
        <institution>Baylor College of Medicine</institution>
        <addr-line>Houston, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Big Data Scientist Training Enhancement Program (BD-STEP)</institution>
        <institution>VA Office of Research and Development</institution>
        <addr-line>Washington, DC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Social Work Service</institution>
        <institution>Butler VA Health Care System</institution>
        <addr-line>Butler, PA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>VA National Social Work Program Office, Care Management and Social Work</institution>
        <institution>Patient Care Services</institution>
        <institution>Department of Veterans Affairs</institution>
        <addr-line>Washington, DC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>VA Tennessee Valley Healthcare System</institution>
        <addr-line>Nashville, TN</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>VA Quality Scholars Coordinating Center</institution>
        <institution>IQuESt</institution>
        <institution>Michael E DeBakey VA Medical Center</institution>
        <addr-line>Houston, TX</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Javad Razjouyan <email>javad.razjouyan@bcm.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>2</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>19</day>
        <month>2</month>
        <year>2021</year>
      </pub-date>
      <volume>9</volume>
      <issue>2</issue>
      <elocation-id>e18756</elocation-id>
      <history>
        <date date-type="received">
          <day>16</day>
          <month>3</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>15</day>
          <month>6</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>16</day>
          <month>11</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>17</day>
          <month>12</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Javad Razjouyan, Jennifer Freytag, Lilian Dindo, Lea Kiefer, Edward Odom, Jaime Halaszynski, Jennifer W Silva, Aanand D Naik. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 19.02.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2021/2/e18756" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Patient Priorities Care (PPC) is a model of care that aligns health care recommendations with priorities of older adults who have multiple chronic conditions. Following identification of patient priorities, this information is documented in the patient’s electronic health record (EHR).</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>Our goal is to develop and validate a natural language processing (NLP) model that reliably documents when clinicians identify patient priorities (ie, values, outcome goals, and care preferences) within the EHR as a measure of PPC adoption.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>This is a retrospective analysis of unstructured National Veteran Health Administration EHR free-text notes using an NLP model. The data were sourced from 778 patient notes of 658 patients from encounters with 144 social workers in the primary care setting. Each patient’s free-text clinical note was reviewed by 2 independent reviewers for the presence of PPC language such as priorities, values, and goals. We developed an NLP model that utilized statistical machine learning approaches. The performance of the NLP model in training and validation with 10-fold cross-validation is reported via accuracy, recall, and precision in comparison to the chart review.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Of 778 notes, 589 (75.7%) were identified as containing PPC language (kappa=0.82, <italic>P</italic>&#60;.001). The NLP model in the training stage had an accuracy of 0.98 (95% CI 0.98-0.99), a recall of 0.98 (95% CI 0.98-0.99), and precision of 0.98 (95% CI 0.97-1.00). The NLP model in the validation stage had an accuracy of 0.92 (95% CI 0.90-0.94), recall of 0.84 (95% CI 0.79-0.89), and precision of 0.84 (95% CI 0.77-0.91). In contrast, an approach using simple search terms for PPC only had a precision of 0.757.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>An automated NLP model can reliably measure with high precision, recall, and accuracy when clinicians document patient priorities as a key step in the adoption of PPC.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>natural language processing</kwd>
        <kwd>NLP</kwd>
        <kwd>social work note</kwd>
        <kwd>decision support</kwd>
        <kwd>machine learning</kwd>
        <kwd>pattern recognition</kwd>
        <kwd>geriatric decision support system</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Older adults with multiple chronic conditions (MCC) frequently receive some of the most intensive and expensive health care, much of which is of uncertain benefit [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. Care for these patients is often inconsistent and fragmented because the multiple specialists they see provide care based on single disease guidelines that do not take into account the complexities of MCC. Moreover, it often does not address what matters most to patients [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. With input from patients, caregivers, clinicians, health system leaders, payers, and health care design experts, we developed Patient Priorities Care (PPC), which involves identifying, documenting, and providing care consistent with patients’ health priorities [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. PPC is an intervention that aims to help clinicians provide health care to older patients with MCC that aligns with their priorities, which include their individual values (what matters most), desired outcome goals, and health care preferences [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref6">6</xref>].</p>
      <p>In the PPC process, there are 3 key steps. First, a trained facilitator works with each patient to identify the patient’s health care priorities: their values, outcome goals, and health care preferences [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Values are the people, things, activities, and capabilities <italic>that matter most</italic> to a person, such as connecting with others, independence, enjoying life, and balancing quality and quantity of life [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. Patient values provide the basis for setting specific, measurable, attainable, realistic, and timely outcome goals (SMART goals). Health care preferences are the activities a patient is willing (or not willing) to do to reach their outcome goals. The second key step in PPC involves documenting patient priorities in the patient’s electronic health record (EHR) [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. This makes information about patient priorities available to different clinicians working with adults with MCC. In the final step of PPC, the clinician uses documented patient priorities to make treatment decisions that align with patient priorities [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
      <p>Social workers frequently serve as facilitators in the PPC approach. Social workers use a holistic approach and encourage self-determination while promoting dignity and worth of the individual. They are also uniquely qualified to provide a wide array of quality social work interventions, including care coordination, case management, individual and group therapy, and supportive counseling for older adults with MCC. Social workers address social determinants of health and provide proactive interventions for social conditions that contribute to poor health outcomes. Social workers facilitate communication between the patient and health care provider and act as an advocate on behalf of the patient.</p>
      <p>The PPC process thus relies on identifying and documenting patient priorities in the EHR so facilitators can share priorities with other clinicians. This documentation is done in the free text of individual visit notes. To measure adoption of PPC, the free text of clinician notes must be analyzed. Analyzing the free-text notes as yes (PPC present) or no (PPC not present) is entitled as text classification [<xref ref-type="bibr" rid="ref9">9</xref>]. Although the gold standard for text classification is human chart review, it is tedious, time consuming, expensive, and potentially risks patient privacy [<xref ref-type="bibr" rid="ref10">10</xref>]. To overcome these limitations, natural language processing (NLP) has been introduced as an alternative or adjunct to manual chart abstraction [<xref ref-type="bibr" rid="ref10">10</xref>]. NLP refers to the computational methods of concepts, entities, events, and relations extraction from free text [<xref ref-type="bibr" rid="ref11">11</xref>]. NLP algorithms are used in a wide spectrum of health care–related purposes such as identifying disease risk factors, evaluating efficiency of care and costs, and extracting information from clinical notes [<xref ref-type="bibr" rid="ref12">12</xref>].</p>
      <p>The first aim of this study was to develop an NLP algorithm capable of confirming social worker use of PPC in the free-text notes of patients’ EHRs. We hypothesized that the NLP model could confirm documentation of patient priorities in the free text of facilitator notes. We compared the performance of the NLP model with a chart‐reviewed reference standard by reporting performance measures (ie, accuracy, recall, specificity, precision, negative predictive value). To further evaluate the performance of the NLP algorithm, we compared its accuracy to a simple search terms approach. We also used the NLP algorithm to monitor the uptake of PPC among trained social workers following dedicated training sessions and track the persistence of PPC adoption over time.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>To create the NLP model to assess the adoption of PPC, we used the notes of a cohort of social workers who were trained to be PPC clinicians over the course of 9 months. This cohort of social workers was hired through the VA Social Work in Patient Aligned Care Teams (PACT) Staffing Program. This program was developed in May 2016 and is the result of a partnership between the Veterans Health Administration (VHA) National Social Work Program Office and the Office of Rural Health. The goal of the program is to embed social workers in rural and highly rural areas to increase Veteran access to high-quality social work services. The innovative program supports the Office of Rural Health’s mission of breaking down barriers separating rural Veterans from high-quality care. Social workers are often one of the first clinicians a Veteran has contact with in the VHA. Social workers in this program provide interventions at numerous rural health VHA medical centers and outpatient clinics across the nation. Two cohorts of social workers were trained: 56 social workers from 5 VA health care systems in 2018 and 88 social workers from 12 VA health care systems in 2019. Social workers were trained to assess, evaluate, and select patients who were good candidates for PPC. Patients had to be older than 60 years of age and have at least two primary care encounters in a prior year. Social workers were trained to facilitate PPC conversations using patient and facilitator workbooks. Social workers were instructed to document all PPC-related interactions in the patient free-text note including all components of PPC. A PPC rubric was provided to social workers to document components of PPC: patient values, outcome goals, and health care preferences (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). After reviewing the PPC template and related notes, we recognized that all notes must have 2 phrases: “goal” and “value.” Notes without these 2 expressions are not considered as PPC.</p>
      </sec>
      <sec>
        <title>Data Collection (Search Term Approach)</title>
        <p>Notes of eligible patients were retrieved from the VHA Corporate Data Warehouse [<xref ref-type="bibr" rid="ref13">13</xref>]. First, notes of all patients who visited with a PPC-trained social worker were retrieved from the Corporate Data Warehouse and included in a database. Notes were obtained from the first facilitated PPC visit through the end of the 2019 calendar year. The Baylor College of Medicine Institutional Review Board and the Veterans Affairs research service (IRB# H-41886) approved this study. Access to patients' data was granted through the Veterans Informatics and Computing Infrastructure.</p>
      </sec>
      <sec>
        <title>The Reference Standard</title>
        <p>To develop the NLP algorithm, we extracted 778 notes from 658 patients who were seen by the social workers. We developed a reference standard for identifying PPC using a formal chart review. We provided complete copies of the notes from the 2018 and 2019 cohorts to 2 independent reviewers (EO and JF). The reviewers ensured the existence of language for values, outcome goals, and care preferences for each free-text note. Charts were labeled as 0 or 1; 0 refers to absence of documented patient priorities for the patient’s note, and 1 refers to documentation of priorities in free-text notes of patients. Any disagreement between reviewers was resolved by a third reviewer, a geriatrician involved in the development of PPC (AN). The agreement among reviewers is reported using the kappa statistic, and the significance level was set at <italic>P&#60;</italic>.05; statistical analysis was conducted using SPSS software.</p>
      </sec>
      <sec>
        <title>NLP Algorithm</title>
        <p>The NLP algorithm was developed using 3 steps: preprocessing, processing, and postprocessing (<xref rid="figure1" ref-type="fig">Figure 1</xref>). In the preprocessing step, we cleaned the text, performed features extraction, and reduced the number of features to reduce the size of the feature space (dimensionality reduction). In the processing step, we developed a classification model to identify the yes-PPC from no-PPC notes. In postprocessing, we reported the performance models developed in the processing step and assessed the generalizability of the model.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Process of developing the natural language processing (NLP) algorithm: (A) retrieving 106,505 notes from trained social workers after the first training workshop; (B) searching notes for existence of 2 expressions “goal” and “value,” which resulted into 778 notes; (C) review and resolution of disagreements; (D) labeling of notes as yes-Patient Priorities Care (PPC; 1) or no-PPC (0); (E) development of NLP algorithm.</p>
          </caption>
          <graphic xlink:href="medinform_v9i2e18756_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <sec>
          <title>Preprocessing, Cleaning the Text</title>
          <p>We converted the stream of text into meaningful elements such as words, phrases, and symbols, called tokenization. We added the part of speech (eg, noun, verb, and pronoun) to each word. We removed stop words (eg, articles, conjunctions, and prepositions) and punctuation as they do not contain informational content. Words were normalized by reducing words to their word stem (stemming technique). For example, the words caregiver, caregivers, and caregiving would be reduced to “caregiv.“</p>
        </sec>
        <sec>
          <title>Cleaning, Features Extraction, and Feature Reduction</title>
          <p>To extract features from the text, we used “bag-of-words” (BoW). BoW (also known as a term-frequency counter) records the number of times that each individual word (unigram) appears in a document. We excluded unigrams with a frequency ≤2. These words must appear in the entire sentence related to goals and values &#60;2 times (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> visualizes the BoW).</p>
        </sec>
        <sec>
          <title>Processing Step, Developing a Classification Model</title>
          <p>We fit a linear regression model to the BoW as an independent variable and the document label of 0 versus 1 as a dependent variable. To develop the model, we used K-fold cross-validation, with K=10. The goal of cross-validation is to test an approach's ability to predict new notes not used in training to avoid problems such as overfitting or selection bias [<xref ref-type="bibr" rid="ref14">14</xref>]. In the 10-fold cross-validation, we randomly split our dataset into 10 equal sections [<xref ref-type="bibr" rid="ref15">15</xref>]. We trained a model with 9 splits, and we validated the performance of the model on the remaining split. The process was repeated 10 times, and the average performance is reported.</p>
        </sec>
        <sec>
          <title>Postprocessing Step</title>
          <p>We tested each model using a validation cohort, using the model with the highest performance as compared to the chart review (validation of the model). To evaluate the performance of the NLP model in training, validation, and test phases, we used sensitivity or recall, specificity, accuracy, positive predictive value or precision, negative predictive value, and area under the curve [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. To further validate the NLP approach, we compared its performance to an approach that used a simple search term assessment for the 2 expressions: “goal” and “value.”</p>
        </sec>
      </sec>
      <sec>
        <title>PPC Adoption</title>
        <p>As a second objective, we evaluated the adoption of PPC among trained social workers. We counted the number of yes-PPC notes in each month, and we created a time series of notes identified by the PPC algorithm. The x axis shows the month, and the y axis shows the number of documented notes with PPC language in the EHR. This evaluation helped to understand the implementation of the PPC approach among social workers who received formal training and the persistence of PPC adoption over time.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Data</title>
        <p>We collected 778 notes that had “goal” and “value” within their text. These notes were collected from 658 patients from 17 VA facilities by 82 social workers. Mean patient age was 70.4 years (SD 15.2 years), 91.6% (603/658) were male, 23.4% (154/658) had all-cause-of-mortality recorded, 91.8% (604/658) were of “Not Hispanic or Latino” ethnicity, 71.9% (473/658) were White, 6.7% (44/658) were “Black or African American,” and 47.4% (312/658) were married.</p>
        <p>The 2 reviewers disagreed on 54 notes and agreed on 724 (724/778, 93.1%) notes. The level of agreement after removing the chance effect was reduced to 82% (kappa=0.820, standard error 0.023, <italic>P</italic>&#60;.001).</p>
      </sec>
      <sec>
        <title>Model Performance</title>
        <p>The performance of the NLP model is shown in <xref ref-type="table" rid="table1">Table 1</xref>. The NLP model performance was calculated over notes (N=778) that had “goal” and “value” in their text. In the 10-fold cross-validation, the model validation reached an average of 0.92 (95% CI 0.90-0.94) for accuracy, 0.84 (95% CI 0.79-0.89) for sensitivity, 0.95 (95% CI 0.92-0.97) for specificity, 0.84 (95% CI 0.77-0.91) for the positive predictive value, and 0.95 (95% CI 0.93-0.96) for the negative predictive value.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Comparison of chart-reviewed, free-text notes and natural language processing (NLP) model for the training and validation.</p>
          </caption>
          <table border="1" rules="groups" cellpadding="5" frame="hsides" width="1000" cellspacing="0">
            <col width="300"/>
            <col width="350"/>
            <col width="350"/>
            <thead>
              <tr valign="top">
                <td>Parameters</td>
                <td>Training, mean (95% CI)<sup>a</sup></td>
                <td>Validation, mean (95% CI)<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Accuracy</td>
                <td>0.98 (0.98-0.99)</td>
                <td>0.92 (0.90-0.94)</td>
              </tr>
              <tr valign="top">
                <td>Sensitivity or recall</td>
                <td>0.98 (0.98-0.99)</td>
                <td>0.84 (0.79-0.89)</td>
              </tr>
              <tr valign="top">
                <td>Specificity</td>
                <td>0.99 (0.98-0.99)</td>
                <td>0.95 (0.92-0.97)</td>
              </tr>
              <tr valign="top">
                <td>Positive predictive values or precision</td>
                <td>0.98 (0.97-1.00)</td>
                <td>0.84 (0.77-0.91)</td>
              </tr>
              <tr valign="top">
                <td>Negative predictive value</td>
                <td>0.99 (0.98-0.99)</td>
                <td>0.95 (0.93-0.96)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Reported for 10-fold cross validation.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>In contrast, an approach using simple search terms (“goal” and “value”) applied to large text performed less well. The total number of notes that the social workers produced was 106,505. <xref ref-type="table" rid="table2">Table 2</xref> describes the precision of this model. The precision of the NLP model was &#62;0.99, while the precision of the simple search terms was 0.7571. In the other words, the simple search terms method falsely recognized 1 out of 4 notes as PPC.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Comparison of the natural language processing (NLP) model and simple search terms on all 106,505 notes.</p>
          </caption>
          <table border="1" rules="groups" cellpadding="5" frame="hsides" width="1000" cellspacing="0">
            <col width="300"/>
            <col width="350"/>
            <col width="350"/>
            <thead>
              <tr valign="top">
                <td>Parameters</td>
                <td>Search terms</td>
                <td>NLP model</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Accuracy</td>
                <td>0.9982</td>
                <td>0.9999</td>
              </tr>
              <tr valign="top">
                <td>Sensitivity or recall</td>
                <td>1.0000</td>
                <td>0.9999</td>
              </tr>
              <tr valign="top">
                <td>Specificity</td>
                <td>0.9982</td>
                <td>0.9983</td>
              </tr>
              <tr valign="top">
                <td>Positive predictive values or precision</td>
                <td>0.7571</td>
                <td>1.0000</td>
              </tr>
              <tr valign="top">
                <td>Negative predictive value</td>
                <td>1.0000</td>
                <td>0.9849</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p><xref rid="figure2" ref-type="fig">Figure 2</xref> describes the adoption of PPC within the notes of trained social workers over time. The 2 peaks represent the times immediately following training of social workers to use PPC. <xref rid="figure2" ref-type="fig">Figure 2</xref> also demonstrates that several months following the cessation of training, the persistence of PPC adoption declined. The NLP algorithm was useful in tracking PPC adoption over time.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Monthly report of the number of Patient Priorities Care (PPC) encounters documented in the patients’ free-text notes in the Veterans Administration (VA) electronic health records; the 2 peaks are associated with training of social workers to use PPC.</p>
          </caption>
          <graphic xlink:href="medinform_v9i2e18756_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Our results demonstrate that an NLP algorithm was highly accurate in identifying patients’ free-text notes with PPC language. Such a design has shown promise in previous work identifying risk factors for heart disease [<xref ref-type="bibr" rid="ref18">18</xref>]. The NLP model had a high performance of 0.84 in validation, and its precision was higher than an approach using only simple search terms. The NLP algorithm was also able to capture peaks in PPC adoption following social worker training and the eventual decline in PPC adoption over time. Such a tool may be used to monitor the overall implementation of interventions like PPC among trained social workers and to adjust the training process.</p>
        <p>While this NLP model performed well, model performance (precision and recall) could improve with the use of more complex strategies such as utilizing bigram or n-gram BoW, other sophisticated feature extractions (eg, graph mining [<xref ref-type="bibr" rid="ref19">19</xref>]), and nonlinear models (eg, deep learning [<xref ref-type="bibr" rid="ref20">20</xref>]). To reduce the computational cost of developing and implementing a model to test the use of PPC by trained facilitators, we propose the NLP model as a method that reduces the time and cost with other methods of assessment. Further development of this model will offer assessment with more precision. Despite these limitations, the NLP model performed better than the simple search term method, which had a 1-in-4 notes rate of misclassification.</p>
        <p>This study opens 3 new avenues for further investigation. By identifying PPC notes, we can longitudinally assess care for patients throughout VA facilities and understand changes in health care delivered after PPC encounters [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. We can identify patterns and consistency in how social workers and other clinicians document patient priorities over the course of multiple interactions with patients [<xref ref-type="bibr" rid="ref3">3</xref>]. By further expanding the NLP algorithm, we can also examine common priorities among our patient population and increase clinician, patient, and caregiver awareness of priorities recorded in the EHR. For successful implementation of PPC, we must assess other factors that play roles in the successful implementation of PPC, such as resource availability, adoption of PPC on a provider and facility level, and readiness of clinicians for implementation [<xref ref-type="bibr" rid="ref4">4</xref>]. We can also use sociodemographic data to pinpoint the ways individual characteristics of patients might influence the implementation of PPC by clinicians. We can also provide individualized feedback to each clinician to enhance their patient engagement process. Using this algorithm, we can measure long-term outcomes of interest, such as mortality and independent living.</p>
      </sec>
      <sec>
        <title>Implications</title>
        <p>This study achieved its overall objective of developing a simple NLP model to identify free-text notes that show evidence of documented patient priorities as part of the PPC process. Our NLP model complements PPC by measuring the extent to which social workers trained in PPC identify and document patient priorities. The NLP model can enable trainers to provide feedback on the implementation of PPC in the EHR. Additionally, this method can analyze the free text of any note for documentation of patient priorities generally in an effort to link those documented priorities with many patient outcomes without requiring labor-intensive methods for individual chart review.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Note template provided to the social workers during online training.</p>
        <media xlink:href="medinform_v9i2e18756_app1.png" xlink:title="PNG File , 607 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Visualization of each word in the Patient Priorities Care (PPC) notes, with the importance based on frequency.</p>
        <media xlink:href="medinform_v9i2e18756_app2.png" xlink:title="PNG File , 389 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">BoW</term>
          <def>
            <p>bag-of-words</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">MCC</term>
          <def>
            <p>multiple chronic conditions</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">PACT</term>
          <def>
            <p>Patient Aligned Care Teams</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">PPC</term>
          <def>
            <p>Patient Priorities Care</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">VHA</term>
          <def>
            <p>Veterans Health Administration</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This research was funded by the Department of Veterans Affairs, Office of Rural Health and Geriatrics and Extended Care Central Office; and the Center for Innovations in Quality, Effectiveness and Safety (CIN 13-413) at the Michael E. DeBakey VA Medical Center, Houston, TX. JR receives support from the Big Data-Scientist Training Enhancement Program (BD-STEP) at the Department of Veterans Affairs and National Cancer Institute.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>AN and JR had full access to all of the data in the study and take responsibility for the integrity of the data and the accuracy of the data analysis. AN and JR conceived and designed the study. JR, AN, and LD acquired, analyzed, and interpreted the data. JR and JF drafted the manuscript. JV performed the statistical analysis. AN obtained funding. JR, AN, LD, JH, and JS critically revised the manuscript for important intellectual content. JF, LK, EO, JH, and JS provided administrative, technical, or material support. AN and LD supervised the study.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ferris</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Blaum</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kiwak</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Austin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Esterson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Harkless</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Oftedahl</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Parchman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Van Ness</surname>
              <given-names>PH</given-names>
            </name>
            <name name-style="western">
              <surname>Tinetti</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Perspectives of Patients, Clinicians, and Health System Leaders on Changes Needed to Improve the Health Care and Outcomes of Older Adults With Multiple Chronic Conditions</article-title>
          <source>J Aging Health</source>
          <year>2018</year>
          <month>06</month>
          <day>01</day>
          <volume>30</volume>
          <issue>5</issue>
          <fpage>778</fpage>
          <lpage>799</lpage>
          <pub-id pub-id-type="doi">10.1177/0898264317691166</pub-id>
          <pub-id pub-id-type="medline">28553806</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tinetti</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Esterson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ferris</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Posner</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Blaum</surname>
              <given-names>CS</given-names>
            </name>
          </person-group>
          <article-title>Patient Priority-Directed Decision Making and Care for Older Adults with Multiple Chronic Conditions</article-title>
          <source>Clin Geriatr Med</source>
          <year>2016</year>
          <month>05</month>
          <volume>32</volume>
          <issue>2</issue>
          <fpage>261</fpage>
          <lpage>75</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cger.2016.01.012</pub-id>
          <pub-id pub-id-type="medline">27113145</pub-id>
          <pub-id pub-id-type="pii">S0749-0690(16)00013-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tinetti</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Naik</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Dindo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Costello</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Esterson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Geda</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rosen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hernandez-Bigos</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Ouellet</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Blaum</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Association of Patient Priorities-Aligned Decision-Making With Patient Outcomes and Ambulatory Health Care Burden Among Older Adults With Multiple Chronic Conditions: A Nonrandomized Clinical Trial</article-title>
          <source>JAMA Intern Med</source>
          <year>2019</year>
          <month>10</month>
          <day>07</day>
          <volume>179</volume>
          <issue>12</issue>
          <fpage>1688</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31589281"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamainternmed.2019.4235</pub-id>
          <pub-id pub-id-type="medline">31589281</pub-id>
          <pub-id pub-id-type="pii">2752365</pub-id>
          <pub-id pub-id-type="pmcid">PMC6784811</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blaum</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Rosen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Naik</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Dindo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Vo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hernandez-Bigos</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Esterson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Geda</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ferris</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Costello</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Acampora</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Meehan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tinetti</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Feasibility of Implementing Patient Priorities Care for Older Adults with Multiple Chronic Conditions</article-title>
          <source>J Am Geriatr Soc</source>
          <year>2018</year>
          <month>10</month>
          <day>03</day>
          <volume>66</volume>
          <issue>10</issue>
          <fpage>2009</fpage>
          <lpage>2016</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30281777"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/jgs.15465</pub-id>
          <pub-id pub-id-type="medline">30281777</pub-id>
          <pub-id pub-id-type="pmcid">PMC7015118</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Naik</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Dindo</surname>
              <given-names>LN</given-names>
            </name>
            <name name-style="western">
              <surname>Van Liew</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Hundt</surname>
              <given-names>NE</given-names>
            </name>
            <name name-style="western">
              <surname>Vo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hernandez-Bigos</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Esterson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Geda</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rosen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Blaum</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Tinetti</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Development of a Clinically Feasible Process for Identifying Individual Health Priorities</article-title>
          <source>J Am Geriatr Soc</source>
          <year>2018</year>
          <month>10</month>
          <day>03</day>
          <volume>66</volume>
          <issue>10</issue>
          <fpage>1872</fpage>
          <lpage>1879</lpage>
          <pub-id pub-id-type="doi">10.1111/jgs.15437</pub-id>
          <pub-id pub-id-type="medline">30281794</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Freytag</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dindo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Catic</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Bush Amspoker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gravier</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dawson</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Tinetti</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Naik</surname>
              <given-names>AD</given-names>
            </name>
          </person-group>
          <article-title>Feasibility of Clinicians Aligning Health Care with Patient Priorities in Geriatrics Ambulatory Care</article-title>
          <source>J Am Geriatr Soc</source>
          <year>2020</year>
          <month>09</month>
          <day>20</day>
          <volume>68</volume>
          <issue>9</issue>
          <fpage>2112</fpage>
          <lpage>2116</lpage>
          <pub-id pub-id-type="doi">10.1111/jgs.16662</pub-id>
          <pub-id pub-id-type="medline">32687218</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Naik</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Moye</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Karel</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Health Values and Treatment Goals of Older, Multimorbid Adults Facing Life-Threatening Illness</article-title>
          <source>J Am Geriatr Soc</source>
          <year>2016</year>
          <month>03</month>
          <day>21</day>
          <volume>64</volume>
          <issue>3</issue>
          <fpage>625</fpage>
          <lpage>31</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27000335"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/jgs.14027</pub-id>
          <pub-id pub-id-type="medline">27000335</pub-id>
          <pub-id pub-id-type="pmcid">PMC5001155</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Karel</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mulligan</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Walder</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Moye</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Naik</surname>
              <given-names>AD</given-names>
            </name>
          </person-group>
          <article-title>Valued life abilities among veteran cancer survivors</article-title>
          <source>Health Expect</source>
          <year>2016</year>
          <month>06</month>
          <day>29</day>
          <volume>19</volume>
          <issue>3</issue>
          <fpage>679</fpage>
          <lpage>90</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25645124"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/hex.12343</pub-id>
          <pub-id pub-id-type="medline">25645124</pub-id>
          <pub-id pub-id-type="pmcid">PMC4869069</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kowsari</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Jafari Meimandi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Heidarysafa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mendu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Barnes</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>DE</given-names>
            </name>
          </person-group>
          <article-title>Text Classification Algorithms: A Survey</article-title>
          <source>Information</source>
          <year>2019</year>
          <month>04</month>
          <day>23</day>
          <volume>10</volume>
          <issue>4</issue>
          <fpage>150</fpage>
          <pub-id pub-id-type="doi">10.3390/info10040150</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carrell</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Halgrim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>DT</given-names>
            </name>
            <name name-style="western">
              <surname>Buist</surname>
              <given-names>DSM</given-names>
            </name>
            <name name-style="western">
              <surname>Chubak</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>WW</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Using natural language processing to improve efficiency of manual chart abstraction in research: the case of breast cancer recurrence</article-title>
          <source>Am J Epidemiol</source>
          <year>2014</year>
          <month>03</month>
          <day>15</day>
          <volume>179</volume>
          <issue>6</issue>
          <fpage>749</fpage>
          <lpage>58</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24488511"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/aje/kwt441</pub-id>
          <pub-id pub-id-type="medline">24488511</pub-id>
          <pub-id pub-id-type="pii">kwt441</pub-id>
          <pub-id pub-id-type="pmcid">PMC3939853</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Rastegar-Mojarad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moon</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Afzal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mehrabi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Clinical information extraction applications: A literature review</article-title>
          <source>J Biomed Inform</source>
          <year>2018</year>
          <month>01</month>
          <volume>77</volume>
          <fpage>34</fpage>
          <lpage>49</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(17)30256-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2017.11.011</pub-id>
          <pub-id pub-id-type="medline">29162496</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(17)30256-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC5771858</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Koleck</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dreisbach</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bourne</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Bakken</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing of symptoms documented in free-text narratives of electronic health records: a systematic review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2019</year>
          <month>04</month>
          <day>01</day>
          <volume>26</volume>
          <issue>4</issue>
          <fpage>364</fpage>
          <lpage>379</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30726935"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocy173</pub-id>
          <pub-id pub-id-type="medline">30726935</pub-id>
          <pub-id pub-id-type="pii">5307912</pub-id>
          <pub-id pub-id-type="pmcid">PMC6657282</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Begoli</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kistler</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bates</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Towards a heterogeneous, polystore-like data architecture for the US Department of Veteran Affairs (VA) enterprise analytics</article-title>
          <year>2017</year>
          <conf-name>2016 IEEE International Conference on Big Data</conf-name>
          <conf-date>December 5-8, 2016</conf-date>
          <conf-loc>Washington, DC</conf-loc>
          <pub-id pub-id-type="doi">10.1109/bigdata.2016.7840896</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cawley</surname>
              <given-names>GC</given-names>
            </name>
            <name name-style="western">
              <surname>Talbot</surname>
              <given-names>NLC</given-names>
            </name>
          </person-group>
          <article-title>On over-fitting in model selection and subsequent selection bias in performance evaluation</article-title>
          <source>Journal of Machine Learning Research</source>
          <year>2010</year>
          <volume>11</volume>
          <fpage>2079</fpage>
          <lpage>2107</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chicco</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Ten quick tips for machine learning in computational biology</article-title>
          <source>BioData Min</source>
          <year>2017</year>
          <month>12</month>
          <day>8</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>35</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://biodatamining.biomedcentral.com/articles/10.1186/s13040-017-0155-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13040-017-0155-3</pub-id>
          <pub-id pub-id-type="medline">29234465</pub-id>
          <pub-id pub-id-type="pii">155</pub-id>
          <pub-id pub-id-type="pmcid">PMC5721660</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meystre</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Haug</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing to extract medical problems from electronic clinical documents: performance evaluation</article-title>
          <source>J Biomed Inform</source>
          <year>2006</year>
          <month>12</month>
          <volume>39</volume>
          <issue>6</issue>
          <fpage>589</fpage>
          <lpage>99</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(05)00114-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2005.11.004</pub-id>
          <pub-id pub-id-type="medline">16359928</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(05)00114-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ly</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Pamer</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dang</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Brajovic</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Haider</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Botsis</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Milward</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Winter</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ball</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of Natural Language Processing (NLP) systems to annotate drug product labeling with MedDRA terminology</article-title>
          <source>J Biomed Inform</source>
          <year>2018</year>
          <month>07</month>
          <volume>83</volume>
          <fpage>73</fpage>
          <lpage>86</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(18)30106-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2018.05.019</pub-id>
          <pub-id pub-id-type="medline">29860093</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(18)30106-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Garibaldi</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>A hybrid model for automatic identification of risk factors for heart disease</article-title>
          <source>J Biomed Inform</source>
          <year>2015</year>
          <month>12</month>
          <volume>58 Suppl</volume>
          <fpage>S171</fpage>
          <lpage>82</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(15)00199-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2015.09.006</pub-id>
          <pub-id pub-id-type="medline">26375492</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(15)00199-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC4989091</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Madan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Szostak</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Komandur Elayavilli</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>RTH</given-names>
            </name>
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Rastegar-Mojarad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hoeng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fluck</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The extraction of complex relationships and their conversion to biological expression language (BEL) overview of the BioCreative VI (2017) BEL track</article-title>
          <source>Database (Oxford)</source>
          <year>2019</year>
          <month>01</month>
          <day>01</day>
          <volume>2019</volume>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://academic.oup.com/database/article-lookup/doi/10.1093/database/baz084"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/database/baz084</pub-id>
          <pub-id pub-id-type="medline">31603193</pub-id>
          <pub-id pub-id-type="pii">5585579</pub-id>
          <pub-id pub-id-type="pmcid">PMC6787548</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wagholikar</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>McCray</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chueh</surname>
              <given-names>HC</given-names>
            </name>
          </person-group>
          <article-title>Medical subdomain classification of clinical notes using a machine learning-based natural language processing approach</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2017</year>
          <month>12</month>
          <day>01</day>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>155</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-017-0556-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-017-0556-8</pub-id>
          <pub-id pub-id-type="medline">29191207</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-017-0556-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC5709846</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Feder</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kiwak</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Costello</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Dindo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hernandez-Bigos</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Vo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Geda</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Blaum</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tinetti</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Naik</surname>
              <given-names>AD</given-names>
            </name>
          </person-group>
          <article-title>Perspectives of Patients in Identifying Their Values-Based Health Priorities</article-title>
          <source>J Am Geriatr Soc</source>
          <year>2019</year>
          <month>07</month>
          <volume>67</volume>
          <issue>7</issue>
          <fpage>1379</fpage>
          <lpage>1385</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30844080"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/jgs.15850</pub-id>
          <pub-id pub-id-type="medline">30844080</pub-id>
          <pub-id pub-id-type="pmcid">PMC6612577</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
