<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v12i1e57949</article-id><article-id pub-id-type="doi">10.2196/57949</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Natural Language Processing Versus Diagnosis Code&#x2013;Based Methods for Postherpetic Neuralgia Identification: Algorithm Development and Validation</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Zheng</surname><given-names>Chengyi</given-names></name><degrees>MS, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ackerson</surname><given-names>Bradley</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Qiu</surname><given-names>Sijia</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sy</surname><given-names>Lina S</given-names></name><degrees>MPH</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Daily</surname><given-names>Leticia I Vega</given-names></name><degrees>MSW</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Song</surname><given-names>Jeannie</given-names></name><degrees>MPH</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Qian</surname><given-names>Lei</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Luo</surname><given-names>Yi</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ku</surname><given-names>Jennifer H</given-names></name><degrees>MPH, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Cheng</surname><given-names>Yanjun</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Wu</surname><given-names>Jun</given-names></name><degrees>MS, MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Tseng</surname><given-names>Hung Fu</given-names></name><degrees>MPH, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff3">3</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Research &#x0026; Evaluation, Kaiser Permanente Southern California</institution>, <addr-line>100 S Los Robles Ave, 2nd Floor</addr-line><addr-line>Pasadena</addr-line><addr-line>CA</addr-line>, <country>United States</country></aff><aff id="aff2"><institution>South Bay Medical Center, Kaiser Permanente Southern California</institution>, <addr-line>Harbor City</addr-line><addr-line>CA</addr-line>, <country>United States</country></aff><aff id="aff3"><institution>Kaiser Permanente Bernard J. Tyson School of Medicine</institution>, <addr-line>Pasadena</addr-line><addr-line>CA</addr-line>, <country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Chen</surname><given-names>Qingyu</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Hosny</surname><given-names>Ahmed</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Kawai</surname><given-names>Kosuke</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Chengyi Zheng, MS, PhD, Department of Research &#x0026; Evaluation, Kaiser Permanente Southern California, 100 S Los Robles Ave, 2nd Floor, Pasadena, 91101, CA, United States, 1 6269868665, 1 626-564-7872; <email>chengyi.x.zheng@kp.org</email></corresp></author-notes><pub-date pub-type="collection"><year>2024</year></pub-date><pub-date pub-type="epub"><day>10</day><month>9</month><year>2024</year></pub-date><volume>12</volume><elocation-id>e57949</elocation-id><history><date date-type="received"><day>01</day><month>03</month><year>2024</year></date><date date-type="rev-recd"><day>02</day><month>07</month><year>2024</year></date><date date-type="accepted"><day>08</day><month>07</month><year>2024</year></date></history><copyright-statement>&#x00A9; Chengyi Zheng, Bradley Ackerson, Sijia Qiu, Lina S Sy, Leticia I Vega Daily, Jeannie Song, Lei Qian, Yi Luo, Jennifer H Ku, Yanjun Cheng, Jun Wu, Hung Fu Tseng. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 10.9.2024. </copyright-statement><copyright-year>2024</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2024/1/e57949"/><abstract><sec><title>Background</title><p>Diagnosis codes and prescription data are used in algorithms to identify postherpetic neuralgia (PHN), a debilitating complication of herpes zoster (HZ). Because of the questionable accuracy of codes and prescription data, manual chart review is sometimes used to identify PHN in electronic health records (EHRs), which can be costly and time-consuming.</p></sec><sec><title>Objective</title><p>This study aims to develop and validate a natural language processing (NLP) algorithm for automatically identifying PHN from unstructured EHR data and to compare its performance with that of code-based methods.</p></sec><sec sec-type="methods"><title>Methods</title><p>This retrospective study used EHR data from Kaiser Permanente Southern California, a large integrated health care system that serves over 4.8 million members. The source population included members aged &#x2265;50 years who received an incident HZ diagnosis and accompanying antiviral prescription between 2018 and 2020 and had &#x2265;1 encounter within 90&#x2010;180 days of the incident HZ diagnosis. The study team manually reviewed the EHR and identified PHN cases. For NLP development and validation, 500 and 800 random samples from the source population were selected, respectively. The sensitivity, specificity, positive predictive value (PPV), negative predictive value (NPV), F-score, and Matthews correlation coefficient (MCC) of NLP and the code-based methods were evaluated using chart-reviewed results as the reference standard.</p></sec><sec sec-type="results"><title>Results</title><p>The NLP algorithm identified PHN cases with a 90.9% sensitivity, 98.5% specificity, 82% PPV, and 99.3% NPV. The composite scores of the NLP algorithm were 0.89 (F-score) and 0.85 (MCC). The prevalences of PHN in the validation data were 6.9% (reference standard), 7.6% (NLP), and 5.4%&#x2010;13.1% (code-based). The code-based methods achieved a 52.7%&#x2010;61.8% sensitivity, 89.8%&#x2010;98.4% specificity, 27.6%&#x2010;72.1% PPV, and 96.3%&#x2010;97.1% NPV. The F-scores and MCCs ranged between 0.45 and 0.59 and between 0.32 and 0.61, respectively.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>The automated NLP-based approach identified PHN cases from the EHR with good accuracy. This method could be useful in population-based PHN research.</p></sec></abstract><kwd-group><kwd>postherpetic neuralgia</kwd><kwd>herpes zoster</kwd><kwd>natural language processing</kwd><kwd>electronic health record</kwd><kwd>real-world data</kwd><kwd>artificial intelligence</kwd><kwd>development</kwd><kwd>validation</kwd><kwd>diagnosis</kwd><kwd>EHR</kwd><kwd>algorithm</kwd><kwd>EHR data</kwd><kwd>sensitivity</kwd><kwd>specificity</kwd><kwd>validation data</kwd><kwd>neuralgia</kwd><kwd>recombinant zoster vaccine</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Herpes zoster (HZ) or shingles is a painful dermatomal vesicular disease that results from the reactivation of the latent varicella-zoster virus in the nerve ganglia [<xref ref-type="bibr" rid="ref1">1</xref>]. Nearly all adults have the varicella-zoster virus dormant in their nervous system [<xref ref-type="bibr" rid="ref2">2</xref>], and the estimated lifetime risk of HZ was approximately 30% prior to the availability of the zoster vaccine [<xref ref-type="bibr" rid="ref3">3</xref>]. HZ usually begins with a prodromal stage of discomfort, followed by a painful, itchy rash on one unilateral dermatome that lasts 2 to 4 weeks [<xref ref-type="bibr" rid="ref4">4</xref>]. Patients with HZ may develop postherpetic neuralgia (PHN)&#x2014;dermatomal pain persisting at least 90 days after the appearance of the acute HZ rash [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. PHN is the most common complication of HZ and greatly lowers patients&#x2019; quality of life [<xref ref-type="bibr" rid="ref3">3</xref>].</p><p>Population-based studies using real-world data are cost-effective ways to address many questions about PHN [<xref ref-type="bibr" rid="ref3">3</xref>]. However, accurately identifying PHN is difficult. Clinical trials rely on predetermined follow-up visits, which are difficult to replicate in real-world settings [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. Due to time and resource constraints, prospective studies have mainly been limited to hundreds of patients with HZ and smaller numbers of PHN cases [<xref ref-type="bibr" rid="ref3">3</xref>]. Retrospective studies of PHN have relied heavily on diagnosis codes [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref13">13</xref>], which lack accuracy [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref14">14</xref>], or manual chart review [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref16">16</xref>], which is costly and time-consuming. Moreover, despite the widespread use of code-based algorithms, only a few publications included PHN algorithm validation results [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref10">10</xref>].</p><p>Natural language processing (NLP), a subfield of artificial intelligence, has been used to identify and extract information from unstructured clinical data. We previously developed NLP methods to identify HZ ophthalmicus and HZ ophthalmicus with eye involvement, which are also common HZ complications [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. In this study, we developed and validated an NLP algorithm to identify PHN. Using manual chart-reviewed results as a reference standard, we compared the performance of the NLP algorithm with that of 5 previously published code-based algorithms.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Setting</title><p>This study was conducted at Kaiser Permanente Southern California (KPSC), an integrated health care system with 16 hospitals and 197 medical offices that serves over 4.8 million members. The prepaid health plan incentivizes members to use services at KPSC facilities. The electronic health record (EHR) system at KPSC stores all aspects of member care, including sociodemographic characteristics, medical encounters, diagnoses, laboratory tests, pharmacy use, immunization records, membership history, and billing and claims.</p></sec><sec id="s2-2"><title>PHN Case Definition</title><p>PHN was defined as pain or discomfort consistent with the HZ episode &#x2265;90 days after the initial HZ diagnosis; the symptoms were at the location of the initial HZ rash and were not due to other obvious causes [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>].</p></sec><sec id="s2-3"><title>Data Sets</title><p>This study used EHR data of patients aged &#x2265;50 years who each had an incident HZ diagnosis and associated antiviral prescription between 2018 and 2020 at KPSC. All patients had to have at least 1 year of membership prior to the index (incident HZ diagnosis) date so that comorbidities and health care use could be ascertained. Among patients with &#x2265;1 encounter during the 90&#x2010;180 days after the incident HZ diagnosis, trained research associates reviewed their EHRs based on the PHN abstraction instructions (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). An infectious disease physician (BKA) reviewed all possible or unclear cases. From these reviewed cases, we randomly selected 500 cases for NLP development and 800 cases for NLP validation. Because the NLP work was done concurrently with the manual review, the development data set was collected at an earlier stage, when the reviewed cohort had a greater proportion of Asian and recombinant zoster vaccine&#x2013;vaccinated patients.</p></sec><sec id="s2-4"><title>Reference Standard</title><p>Among the 800 cases in the validation data set, BKA reviewed 37 HZ cases that research associates had identified as unclear PHN cases. Because reviewers sometimes missed positive mentions of PHN, BKA rereviewed cases in the validation set where NLP results differed from reviewer results. Nine cases were corrected from negative to positive PHN. These manually reviewed results served as the reference standard for assessing the performance of PHN identification algorithms.</p></sec><sec id="s2-5"><title>NLP Algorithm Development</title><p>We developed the NLP algorithm based on our previous work [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]. <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> describes the steps for preprocessing text and generating nomenclature. We created the rule-based NLP algorithm using the Linguamatics I2E software (Linguamatics, an IQVIA company). Each note was searched at different levels: section (eg, &#x201C;Physical Exam,&#x201D; &#x201C;Assessment/Plan&#x201D;), cross-sentence, intrasentence, and phrase. A distance-based relationship algorithm was applied to identify related terms based on the number of words or sentences between them. The relationship search identified the words or phrases (eg, negated, uncertain, and hypothetical statements) that modified the concepts of interest.</p><p><xref ref-type="fig" rid="figure1">Figure 1</xref> depicts an overview of the NLP algorithm. We separated the extracted clinical texts into 3 time periods: index (acute HZ) period (&#x2212;7 to 21 d from incident HZ diagnosis date), transitional (subacute HZ) period (22 to 89 d), and risk (defined PHN) period (90 to 180 d). We developed search queries to identify the HZ anatomic locations in the index episode and PHN-related evidence in the transitional and risk periods. Supporting evidence of PHN included explicit mention of ongoing PHN, symptom location and causality, and PHN listed in the assessment and plan section. Counterevidence of PHN included differential diagnoses, recurrent HZ, and resolved PHN. We excluded sections and statements that may have been copied forward as historical information.</p><p>The PHN decision algorithm was implemented in Python language, which incorporated the evidence from the NLP search queries and classified each case based on decision rules. To exclude the copy-pasted results, the NLP program ran search queries on both the transitional and risk periods and compared the results to locate identical sequences of text. The algorithm considered the time sequences of identified evidence. The symptom location during the risk period was compared with the index HZ location. Because adjacent dermatomes might be difficult to distinguish clinically, symptom location during the index and risk periods had to occur in the same or surrounding dermatomes (eg, face and neck). Based on the development data set, we tested and updated the algorithm.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Diagram of NLP algorithm. HZ: herpes zoster; NLP: natural language processing; PHN: postherpetic neuralgia.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v12i1e57949_fig01.png"/></fig></sec><sec id="s2-6"><title>Implementation of Published PHN Identification Algorithms</title><p>We selected and implemented 5 code-based PHN identification algorithms based on the variety of their algorithms, the journal category and impact factor, the publication year, the total citations, and the size of the study (<xref ref-type="table" rid="table1">Table 1</xref>). The first code-based method (C1: Yanni et al [<xref ref-type="bibr" rid="ref27">27</xref>]) exclusively used PHN-related diagnosis codes (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). The remaining 4 algorithms (C2: Klompas et al [<xref ref-type="bibr" rid="ref8">8</xref>]; C3: Klein et al [<xref ref-type="bibr" rid="ref10">10</xref>]; C4: Forbes et al [<xref ref-type="bibr" rid="ref9">9</xref>]; C5: Munoz-Quiles et al [<xref ref-type="bibr" rid="ref11">11</xref>]) used additional structured data, such as diagnosis codes for HZ, neuralgia, and chronic pain; prescriptions for analgesics, antidepressants, and anticonvulsants; and clinical visit data.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>List of sources for selected code-based methods.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Method</td><td align="left" valign="bottom">Herpes zoster cases, n</td><td align="left" valign="bottom">Journal category</td><td align="left" valign="bottom">Journal (IF<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup>)</td><td align="left" valign="bottom">Year</td><td align="left" valign="bottom">TC<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top">C1 [<xref ref-type="bibr" rid="ref27">27</xref>]</td><td align="left" valign="top">21,146</td><td align="left" valign="top">General medicine</td><td align="left" valign="top">BMJ Open (2.9)</td><td align="left" valign="top">2018</td><td align="left" valign="top">67</td></tr><tr><td align="left" valign="top">C2 [<xref ref-type="bibr" rid="ref8">8</xref>]</td><td align="left" valign="top">2089</td><td align="left" valign="top">General medicine</td><td align="left" valign="top">Mayo Clinic Proceeding (8.9)</td><td align="left" valign="top">2011</td><td align="left" valign="top">125</td></tr><tr><td align="left" valign="top">C3 [<xref ref-type="bibr" rid="ref10">10</xref>]</td><td align="left" valign="top">62,205</td><td align="left" valign="top">Immunology</td><td align="left" valign="top">Vaccine (5.5)</td><td align="left" valign="top">2019</td><td align="left" valign="top">32</td></tr><tr><td align="left" valign="top">C4 [<xref ref-type="bibr" rid="ref9">9</xref>]</td><td align="left" valign="top">119,413</td><td align="left" valign="top">Neurology</td><td align="left" valign="top">Neurology (10.1)</td><td align="left" valign="top">2016</td><td align="left" valign="top">155</td></tr><tr><td align="left" valign="top">C5 [<xref ref-type="bibr" rid="ref11">11</xref>]</td><td align="left" valign="top">87,086</td><td align="left" valign="top">Infectious diseases</td><td align="left" valign="top">Journal of Infection (28.2)</td><td align="left" valign="top">2018</td><td align="left" valign="top">38</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>IF: impact factor based on Journal Citation Report released in 2023.</p></fn><fn id="table1fn2"><p><sup>b</sup>TC: total citations based on Google Scholar as of July 1, 2024.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-7"><title>Validation and Analysis</title><p>The results generated from the various algorithms were evaluated against the chart-reviewed reference standard validation data set. We counted the numbers of true-positive (TP), false-positive (FP), true-negative (TN), and false-negative (FN) cases to calculate the performance metrics: sensitivity, specificity, positive predictive value (PPV), negative predictive value (NPV), F-score [<xref ref-type="bibr" rid="ref28">28</xref>], and Matthews correlation coefficient (MCC) [<xref ref-type="bibr" rid="ref29">29</xref>].</p><p>The F-score is a combination metric in machine learning and NLP research. It is defined as a weighted harmonic mean of sensitivity and PPV, where the parameter <inline-formula><mml:math id="ieqn1"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>&#x03B2;</mml:mi></mml:mrow></mml:mstyle></mml:math></inline-formula> represents the relative importance of sensitivity versus PPV.</p><disp-formula id="E1"><mml:math id="eqn1"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="normal">F</mml:mi><mml:mo>&#x2212;</mml:mo><mml:mi mathvariant="normal">s</mml:mi><mml:mi mathvariant="normal">c</mml:mi><mml:mi mathvariant="normal">o</mml:mi><mml:mi mathvariant="normal">r</mml:mi><mml:mi mathvariant="normal">e</mml:mi></mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msup><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msup><mml:mo>+</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo><mml:mspace width="thinmathspace"/><mml:mo>&#x2217;</mml:mo><mml:mspace width="thinmathspace"/><mml:mrow><mml:mi mathvariant="normal">P</mml:mi><mml:mi mathvariant="normal">P</mml:mi><mml:mi mathvariant="normal">V</mml:mi></mml:mrow><mml:mspace width="thinmathspace"/><mml:mo>&#x2217;</mml:mo><mml:mspace width="thinmathspace"/><mml:mrow><mml:mi mathvariant="normal">s</mml:mi><mml:mi mathvariant="normal">e</mml:mi><mml:mi mathvariant="normal">n</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mi mathvariant="normal">i</mml:mi><mml:mi mathvariant="normal">t</mml:mi><mml:mi mathvariant="normal">i</mml:mi><mml:mi mathvariant="normal">v</mml:mi><mml:mi mathvariant="normal">i</mml:mi><mml:mi mathvariant="normal">t</mml:mi><mml:mi mathvariant="normal">y</mml:mi></mml:mrow></mml:mrow><mml:mrow><mml:msup><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msup><mml:mo>&#x2217;</mml:mo><mml:mspace width="thinmathspace"/><mml:mrow><mml:mi mathvariant="normal">P</mml:mi><mml:mi mathvariant="normal">P</mml:mi><mml:mi mathvariant="normal">V</mml:mi></mml:mrow><mml:mspace width="thinmathspace"/><mml:mo>+</mml:mo><mml:mspace width="thinmathspace"/><mml:mrow><mml:mi mathvariant="normal">s</mml:mi><mml:mi mathvariant="normal">e</mml:mi><mml:mi mathvariant="normal">n</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mi mathvariant="normal">i</mml:mi><mml:mi mathvariant="normal">t</mml:mi><mml:mi mathvariant="normal">i</mml:mi><mml:mi mathvariant="normal">v</mml:mi><mml:mi mathvariant="normal">i</mml:mi><mml:mi mathvariant="normal">t</mml:mi><mml:mi mathvariant="normal">y</mml:mi></mml:mrow></mml:mrow></mml:mfrac></mml:mrow></mml:mstyle></mml:math></disp-formula><p>Since a minority of patients with HZ will develop PHN and FNs and sensitivity are more important than PPV, we chose <italic>&#x03B2;</italic>=2 to favor sensitivity over PPV. The F-score&#x2019;s value ranges from 0 to 1, with higher values suggesting better prediction. However, because the F-score does not include TN in its formula, MCC has been proposed as a better overall measurement than the F-score as well as the area under the receiver operating characteristic curve in binary classification [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. The MCC formula considers all 4 confusion matrix categories, with values between &#x2212;1 to 1, where &#x00B1;1 denotes perfect agreement or disagreement between actuals and predictions, and 0 indicates randomness.</p><disp-formula id="E2"><mml:math id="eqn2"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="normal">M</mml:mi><mml:mi mathvariant="normal">C</mml:mi><mml:mi mathvariant="normal">C</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">P</mml:mi><mml:mo>&#x2217;</mml:mo><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mo>&#x2212;</mml:mo><mml:mi mathvariant="normal">F</mml:mi><mml:mi mathvariant="normal">P</mml:mi><mml:mo>&#x2217;</mml:mo><mml:mi mathvariant="normal">F</mml:mi><mml:mi mathvariant="normal">N</mml:mi></mml:mrow><mml:msqrt><mml:mo stretchy="false">(</mml:mo><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">P</mml:mi><mml:mo>+</mml:mo><mml:mi mathvariant="normal">F</mml:mi><mml:mi mathvariant="normal">P</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>&#x2217;</mml:mo><mml:mo stretchy="false">(</mml:mo><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">P</mml:mi><mml:mo>+</mml:mo><mml:mi mathvariant="normal">F</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>&#x2217;</mml:mo><mml:mo stretchy="false">(</mml:mo><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mo>+</mml:mo><mml:mi mathvariant="normal">F</mml:mi><mml:mi mathvariant="normal">P</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>&#x2217;</mml:mo><mml:mo stretchy="false">(</mml:mo><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mo>+</mml:mo><mml:mi mathvariant="normal">F</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:msqrt></mml:mfrac></mml:mrow></mml:mrow></mml:mstyle></mml:math></disp-formula><p>The prevalence proportion of PHN was calculated as the number of identified PHN cases per 100 cases of HZ.</p></sec><sec id="s2-8"><title>Ethical Considerations</title><p>The KPSC institutional review board approved this study (institutional review board number: 12270). A waiver of informed consent was granted for this study because this was a data-only minimal-risk study.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Study Population</title><p>The characteristics of the study population are presented in <xref ref-type="table" rid="table2">Table 2</xref>. The mean (SD) ages of the development and validation data sets were 69.5 (9.1) and 70.0 (9.8) years, respectively, with 329 (65.8%) and 542 (67.8%) being female. The development data set had a higher proportion of Asian (177/500, 35.4% vs 110/796, 13.8%) and recombinant zoster vaccine&#x2013;vaccinated patients (61/500, 12.2% vs 28/800, 3.5%). There were no significant differences between the development and validation data sets in terms of clinical visits and comorbidities prior to the index date. In the development and validation data sets, approximately one-third of the patients had diabetes (159/500, 31.8% and 262/796, 32.8%, respectively), while less than one-quarter had chronic pulmonary disease (88/500, 17.6% and 163/800, 20.4%) and depression (103/500, 20.6% and 189/800, 23.6%). The development data had a higher proportion of patients with cancer as compared with the validation data (52/500, 10.4% vs 54/800, 6.8%).</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Characteristics of patients in the development and validation data sets.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" colspan="2">Characteristics</td><td align="left" valign="bottom" colspan="2">Patients</td><td align="left" valign="bottom"><italic>P</italic> value<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td></tr><tr><td align="left" valign="bottom" colspan="2"/><td align="left" valign="bottom">Development (n=500)</td><td align="left" valign="bottom">Validation (n=800)</td><td align="left" valign="bottom"/></tr></thead><tbody><tr><td align="left" valign="top" colspan="2">Age (year), mean (SD)</td><td align="left" valign="top">69.5 (9.1)</td><td align="left" valign="top">70.0 (9.8)</td><td align="left" valign="top">.47</td></tr><tr><td align="left" valign="top" colspan="4"><bold>Age group (years), n (%)</bold></td><td align="left" valign="top">.52</td></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">50&#x2010;59</td><td align="left" valign="top">70 (14.0)</td><td align="left" valign="top">103 (12.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">60&#x2010;69</td><td align="left" valign="top">172 (34.4)</td><td align="left" valign="top">282 (35.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">70&#x2010;79</td><td align="left" valign="top">187 (37.4)</td><td align="left" valign="top">280 (35.0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">&#x2265;80</td><td align="left" valign="top">71 (14.2)</td><td align="left" valign="top">135 (16.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4"><bold>Sex, n (%)</bold></td><td align="left" valign="top">.47</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Female</td><td align="left" valign="top">329 (65.8)</td><td align="left" valign="top">542 (67.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Male</td><td align="left" valign="top">171 (34.2)</td><td align="left" valign="top">258 (32.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4"><bold>Race or ethnicity, n (%)</bold></td><td align="left" valign="top">&#x003C;.01</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Non-Hispanic White</td><td align="left" valign="top">198 (39.6)</td><td align="left" valign="top">424 (53.0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Hispanic</td><td align="left" valign="top">102 (20.4)</td><td align="left" valign="top">213 (26.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Asian/Pacific Islanders</td><td align="left" valign="top">177 (35.4)</td><td align="left" valign="top">110 (13.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Non-Hispanic Black</td><td align="left" valign="top">18 (3.6)</td><td align="left" valign="top">41 (5.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Other/Multiple/Unknown</td><td align="left" valign="top">5 (1.0)</td><td align="left" valign="top">12 (1.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4"><bold>Number of outpatient/digital visits 6 months before HZ</bold><sup><xref ref-type="table-fn" rid="table2fn2"><bold>b</bold></xref></sup> <bold>diagnosis date, n (%)</bold></td><td align="char" char="." valign="top">.91</td></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">0&#x2010;1</td><td align="left" valign="top">68 (13.6)</td><td align="left" valign="top">106 (13.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">2&#x2010;5</td><td align="left" valign="top">168 (33.6)</td><td align="left" valign="top">262 (32.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">&#x2265;6</td><td align="left" valign="top">264 (52.8)</td><td align="left" valign="top">432 (54.0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4"><bold>Number of emergency department visits 6 months before HZ diagnosis date, n (%)</bold></td><td align="char" char="." valign="top">.08</td></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">0</td><td align="left" valign="top">420 (84.0)</td><td align="left" valign="top">641 (80.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">&#x2265;1</td><td align="left" valign="top">80 (16.0)</td><td align="left" valign="top">159 (19.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4"><bold>Number of hospitalizations 6 months before HZ diagnosis date, n (%)</bold></td><td align="char" char="." valign="top">.45</td></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">0</td><td align="left" valign="top">475 (95.0)</td><td align="left" valign="top">752 (94.0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">&#x2265;1</td><td align="left" valign="top">25 (5.0)</td><td align="left" valign="top">48 (6.0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="5"><bold>Comorbidity 1 year before HZ diagnosis date, n (%)</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Allergic rhinitis</td><td align="left" valign="top">38 (7.6)</td><td align="left" valign="top">51 (6.4)</td><td align="left" valign="top">.39</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Asthma</td><td align="left" valign="top">41 (8.2)</td><td align="left" valign="top">82 (10.3)</td><td align="left" valign="top">.22</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Atopic dermatitis</td><td align="left" valign="top">5 (1.0)</td><td align="left" valign="top">9 (1.1)</td><td align="left" valign="top">.83</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Cancer</td><td align="left" valign="top">52 (10.4)</td><td align="left" valign="top">54 (6.8)</td><td align="left" valign="top">.02</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Chronic pulmonary disease</td><td align="left" valign="top">88 (17.6)</td><td align="left" valign="top">163 (20.4)</td><td align="left" valign="top">.22</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Depression</td><td align="left" valign="top">103 (20.6)</td><td align="left" valign="top">189 (23.6)</td><td align="left" valign="top">.20</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Diabetes</td><td align="left" valign="top">159 (31.8)</td><td align="left" valign="top">262 (32.8)</td><td align="left" valign="top">.72</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Epilepsy and recurrent seizures</td><td align="left" valign="top">8 (1.6)</td><td align="left" valign="top">8 (1.0)</td><td align="left" valign="top">.34</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Heart failure</td><td align="left" valign="top">24 (4.8)</td><td align="left" valign="top">55 (6.9)</td><td align="left" valign="top">.13</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Rheumatoid arthritis</td><td align="left" valign="top">25 (5.0)</td><td align="left" valign="top">38 (4.8)</td><td align="left" valign="top">.84</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Systemic lupus erythematosus</td><td align="left" valign="top">6 (1.2)</td><td align="left" valign="top">6 (0.8)</td><td align="left" valign="top">.41</td></tr><tr><td align="left" valign="top" colspan="4"><bold>Recombinant zoster vaccine, n (%)</bold></td><td align="left" valign="top">&#x003C;.01</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Unvaccinated</td><td align="left" valign="top">439 (87.8)</td><td align="left" valign="top">772 (96.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">1-dose vaccinated</td><td align="left" valign="top">32 (6.4)</td><td align="left" valign="top">9 (1.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Fully (2-dose) vaccinated</td><td align="left" valign="top">29 (5.8)</td><td align="left" valign="top">19 (2.4)</td><td align="left" valign="top"/></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup><italic>&#x03C7;</italic><sup>2</sup> test was used for categorical variables, and Wilcoxon test was used for continuous variables.</p></fn><fn id="table2fn2"><p><sup>b</sup>HZ: herpes zoster.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Validation Data Set</title><p>In the validation data set, the numbers of clinical notes in the index, transitional, and risk periods were 12,158, 14,446, and 18,895, respectively. The percentages of HZ- or PHN-relevant notes were 26.2%, 8.2%, and 3.2%, respectively for the index, transitional, and risk periods. Most of the HZ index visits occurred in primary care, urgent care, emergency departments, and hospital settings (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>). After the index period, HZ-related mentions were much less frequently documented in urgent care visit notes, but more frequently documented in specialist visit notes (41 specialties).</p></sec><sec id="s3-3"><title>Application of NLP on Validation Data Set</title><p>Out of the 800 patients in the validation data set, the NLP algorithm identified 796 patients with HZ who had at least 1 note with HZ- or PHN-related terms in the index period. Among the 4 remaining patients, 2 patients had their index HZ diagnosed outside KPSC and had no follow-up visits in the index period. For the remaining 2 patients, HZ-related symptoms were documented, but no mention of HZ or PHN was made in the clinical notes. Among these 796 patients, the NLP algorithm identified the HZ anatomic location for 751 (94.3%) patients, and among them, 611 (81.3%) had laterality information (<xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>). In the transitional and risk periods, the NLP algorithm identified positive mentions of any pain or discomfort in 370 (46.3%) and 425 (53.1%) patients, respectively.</p></sec><sec id="s3-4"><title>Validation Results</title><p>In the validation data set, the NLP algorithm achieved a 90.9% sensitivity, 98.5% specificity, 82% PPV, and 99.3% NPV (<xref ref-type="table" rid="table3">Table 3</xref>). The composite scores of the NLP algorithm were 0.89 (F-score) and 0.85 (MCC). Of the 800 patients in the validation data set, 55 (6.9%) were chart-confirmed as PHN. The prevalence proportion of PHN identified by the NLP algorithm was 7.6%.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Performance characteristics of natural language processing and code-based methods for identifying postherpetic neuralgia as compared with chart-confirmed reference standard.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Method</td><td align="left" valign="bottom">PHN<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> (%)</td><td align="left" valign="bottom">TP<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup></td><td align="left" valign="bottom">TN<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td><td align="left" valign="bottom">FN<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup></td><td align="left" valign="bottom">FP<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup></td><td align="left" valign="bottom">Sensitivity (%)</td><td align="left" valign="bottom">Specificity (%)</td><td align="left" valign="bottom">PPV<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup> (%)</td><td align="left" valign="bottom">NPV<sup><xref ref-type="table-fn" rid="table3fn7">g</xref></sup> (%)</td><td align="left" valign="bottom">F-score</td><td align="left" valign="bottom">MCC<sup><xref ref-type="table-fn" rid="table3fn8">h</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top">NLP<sup><xref ref-type="table-fn" rid="table3fn9">i</xref></sup></td><td align="left" valign="top">7.6</td><td align="left" valign="top">50</td><td align="left" valign="top">734</td><td align="left" valign="top">5</td><td align="left" valign="top">11</td><td align="left" valign="top">90.9</td><td align="left" valign="top">98.5</td><td align="left" valign="top">82.0</td><td align="left" valign="top">99.3</td><td align="left" valign="top">0.89</td><td align="left" valign="top">0.85</td></tr><tr><td align="left" valign="top">C1</td><td align="left" valign="top">5.4</td><td align="left" valign="top">31</td><td align="left" valign="top">733</td><td align="left" valign="top">24</td><td align="left" valign="top">12</td><td align="left" valign="top">56.4</td><td align="left" valign="top">98.4</td><td align="left" valign="top">72.1</td><td align="left" valign="top">96.8</td><td align="left" valign="top">0.59</td><td align="left" valign="top">0.61</td></tr><tr><td align="left" valign="top">C2</td><td align="left" valign="top">10.9</td><td align="left" valign="top">34</td><td align="left" valign="top">692</td><td align="left" valign="top">21</td><td align="left" valign="top">53</td><td align="left" valign="top">61.8</td><td align="left" valign="top">92.9</td><td align="left" valign="top">39.1</td><td align="left" valign="top">97.1</td><td align="left" valign="top">0.55</td><td align="left" valign="top">0.44</td></tr><tr><td align="left" valign="top">C3</td><td align="left" valign="top">5.5</td><td align="left" valign="top">31</td><td align="left" valign="top">732</td><td align="left" valign="top">24</td><td align="left" valign="top">13</td><td align="left" valign="top">56.4</td><td align="left" valign="top">98.3</td><td align="left" valign="top">70.5</td><td align="left" valign="top">96.8</td><td align="left" valign="top">0.59</td><td align="left" valign="top">0.61</td></tr><tr><td align="left" valign="top">C4</td><td align="left" valign="top">13.1</td><td align="left" valign="top">29</td><td align="left" valign="top">669</td><td align="left" valign="top">26</td><td align="left" valign="top">76</td><td align="left" valign="top">52.7</td><td align="left" valign="top">89.8</td><td align="left" valign="top">27.6</td><td align="left" valign="top">96.3</td><td align="left" valign="top">0.45</td><td align="left" valign="top">0.32</td></tr><tr><td align="left" valign="top">C5</td><td align="left" valign="top">9.3</td><td align="left" valign="top">31</td><td align="left" valign="top">702</td><td align="left" valign="top">24</td><td align="left" valign="top">43</td><td align="left" valign="top">56.4</td><td align="left" valign="top">94.2</td><td align="left" valign="top">41.9</td><td align="left" valign="top">96.7</td><td align="left" valign="top">0.53</td><td align="left" valign="top">0.44</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>PHN: postherpetic neuralgia.</p></fn><fn id="table3fn2"><p><sup>b</sup>TP: true-positive.</p></fn><fn id="table3fn3"><p><sup>c</sup>TN: true-negative.</p></fn><fn id="table3fn4"><p><sup>d</sup>FN: false-negative.</p></fn><fn id="table3fn5"><p><sup>e</sup>FP: false-positive.</p></fn><fn id="table3fn6"><p><sup>f</sup>PPV: positive predictive value.</p></fn><fn id="table3fn7"><p><sup>g</sup>NPV: negative predictive value.</p></fn><fn id="table3fn8"><p><sup>h</sup>MCC: Matthews correlation coefficient.</p></fn><fn id="table3fn9"><p><sup>i</sup>NLP: natural language processing.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-5"><title>Error Analysis of NLP Validation Results</title><p>Error analysis of the FN and FP cases is presented in <xref ref-type="table" rid="table4">Table 4</xref>. Some of the NLP-related errors were caused by the selection of data sources. For 2 FN cases, NLP incorrectly classified them as PHN negative when statements were found indicating HZ-associated pain had resolved even though additional evidence showed the patients still had other PHN-related symptoms. The FP cases were caused by copied-and-pasted text, incorrect causality attribution of symptoms, misclassified recurrent HZ cases as PHN, and unclear clinical documentation.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Error analysis of natural language processing false-negatives and false-positives.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" colspan="2">Type of NLP<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup> error</td><td align="left" valign="bottom">Description</td><td align="left" valign="bottom">Number of cases</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="3"><bold>False-negative</bold></td><td align="char" char="." valign="top">5</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">EHR<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup> data source</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Case 1: We did not include one free text table (formatted messages) from the Epic EHR.</p></list-item><list-item><p>Case 2: PHN<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup> was mentioned in a clinical note from the hematology department, which was excluded from NLP processing.</p></list-item></list></td><td align="char" char="." valign="top">2</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Unclear documentation</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>HZ<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup> or PHN was not stated in the clinical note, which was required by NLP to reduce false-positive hits.</p></list-item></list></td><td align="char" char="." valign="top">1</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Symptom</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>While the patient stated that HZ-associated pain had resolved, documents also indicated that the patient still had other PHN-related symptoms (prickling sensation and itchy).</p></list-item></list></td><td align="char" char="." valign="top">2</td></tr><tr><td align="left" valign="top" colspan="3"><bold>False-positive</bold></td><td align="char" char="." valign="top">11</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">EHR data source</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>We included Epic&#x2019;s SmartData elements, which lacked specificity for PHN identification.</p></list-item></list></td><td align="char" char="." valign="top">2</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Unclear documentation</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>In 2 cases, the text was copied from the clinical notes in the index period. The NLP copy-and-paste detection algorithm was only applied to the clinical notes in the transitional period.</p></list-item><list-item><p>In another 2 cases, PHN and PHN-related medications were listed in the assessment and plan sections. However, it was unclear whether the patient had ongoing symptoms.</p></list-item></list></td><td align="char" char="." valign="top">4</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Acute HZ</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>NLP misclassified 2 acute HZ cases that occurred in the risk period as PHN.</p></list-item></list></td><td align="char" char="." valign="top">2</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Causality</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Case 1: Pain thought to be due to chalazion based on information in follow-up visits.</p></list-item><list-item><p>Case 2: PHN was listed in the assessment section and tramadol and gabapentin were listed in the plan section. However, the medications were likely for lumbosacral radiculopathy.</p></list-item></list></td><td align="char" char="." valign="top">2</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Symptom</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>The patient reported generalized symptoms (nausea) since HZ, but there was no mention of concomitant sensory changes such as pain, thus the case did not meet our PHN definition.</p></list-item></list></td><td align="char" char="." valign="top">1</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>NLP: natural language processing.</p></fn><fn id="table4fn2"><p><sup>b</sup>EHR: electronic health record.</p></fn><fn id="table4fn3"><p><sup>c</sup>PHN: postherpetic neuralgia.</p></fn><fn id="table4fn4"><p><sup>d</sup>HZ: herpes zoster.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-6"><title>Code-Based Methods</title><p>The prevalence proportions of PHN identified by code-based methods ranged from 5.4% to 13.1%. The code-based methods achieved a 52.7%&#x2010;61.8% sensitivity, 89.8%&#x2010;98.4% specificity, 27.6%&#x2010;72.1% PPV, and 96.3%&#x2010;97.1% NPV. The F-scores and MCCs ranged between 0.45 and 0.59 and between 0.32 and 0.61, respectively. The more sophisticated algorithms were no better than the PHN diagnosis code&#x2013;only method as measured by the F-score or MCC. Although each component of the code-based methods identified PHN cases, most of them did not contribute to identifying additional true PHN cases beyond those identified by PHN diagnosis codes, and those that did have much lower PPVs (C4.3: 10.3%, C4.2: 26.1% and C2.2: 37.7%) than the PHN diagnosis code&#x2013;only method (C1, PPV 72.1%) (<xref ref-type="table" rid="table5">Table 5</xref>). We re-reviewed all FP cases from code-based methods C1 and C3 and randomly sampled the remaining FP cases from approaches C2, C4, and C5. Among the 20 reviewed FP cases, we found that none were true PHN cases.</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Postherpetic neuralgia cases identified by code-based methods.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" colspan="3">Method</td><td align="left" valign="bottom">PHN<sup><xref ref-type="table-fn" rid="table5fn1">a</xref></sup> diagnosis code used</td><td align="left" valign="bottom">PHN, n (%)</td><td align="left" valign="bottom">TP<sup><xref ref-type="table-fn" rid="table5fn2">b</xref></sup> (PPV<sup><xref ref-type="table-fn" rid="table5fn3">c</xref></sup>), n (%)</td><td align="left" valign="bottom">Supplementary TP<sup><xref ref-type="table-fn" rid="table5fn4">d</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top" colspan="3">C1<sup><xref ref-type="table-fn" rid="table5fn5">e</xref></sup></td><td align="left" valign="top">&#x2713;</td><td align="left" valign="top">43 (5.4)<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td><td align="left" valign="top">31 (72.1)<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table5fn7">g</xref></sup></td></tr><tr><td align="left" valign="top" colspan="3"><bold>C2</bold></td><td align="left" valign="top">&#x2713;</td><td align="left" valign="top">87 (10.9)<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td><td align="left" valign="top">34 (39.1)<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td><td align="left" valign="top">3<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top" colspan="2">C2.1</td><td align="left" valign="top">&#x2713;</td><td align="left" valign="top">43 (5.4)</td><td align="left" valign="top">31 (72.1)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top" colspan="2">C2.2</td><td align="left" valign="top"/><td align="left" valign="top">69 (8.6)</td><td align="left" valign="top">26 (37.7)</td><td align="left" valign="top">3</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top" colspan="2">C2.3</td><td align="left" valign="top"/><td align="left" valign="top">4 (0.5)</td><td align="left" valign="top">1 (25.0)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top" colspan="3"><bold>C3</bold></td><td align="left" valign="top">&#x2713;</td><td align="left" valign="top">44 (5.5)<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td><td align="left" valign="top">31 (70.5)<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top" colspan="2">C3.1</td><td align="left" valign="top">&#x2713;</td><td align="left" valign="top">24 (3)</td><td align="left" valign="top">18 (75.0)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top" colspan="2">C3.2</td><td align="left" valign="top">&#x2713;</td><td align="left" valign="top">7 (0.9)</td><td align="left" valign="top">7 (100.0)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top" colspan="2">C3.3</td><td align="left" valign="top">&#x2713;</td><td align="left" valign="top">41 (5.1)</td><td align="left" valign="top">29 (70.7)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top" colspan="2">C3.4</td><td align="left" valign="top">&#x2713;</td><td align="left" valign="top">23 (2.9)</td><td align="left" valign="top">17 (73.9)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top" colspan="3"><bold>C4</bold></td><td align="left" valign="top">&#x2713;</td><td align="left" valign="top">105 (13.1)<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td><td align="left" valign="top">29 (27.6)<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td><td align="left" valign="top">2<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top" colspan="2">C4.1</td><td align="left" valign="top">&#x2713;</td><td align="left" valign="top">36 (4.5)</td><td align="left" valign="top">26 (72.2)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top" colspan="2"><bold>C4.2</bold></td><td align="left" valign="top"/><td align="left" valign="top">69 (8.6)</td><td align="left" valign="top">18 (26.1)</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">C4.2.1</td><td align="left" valign="top"/><td align="left" valign="top">7 (0.9)</td><td align="left" valign="top">6 (85.7)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">C4.2.2</td><td align="left" valign="top"/><td align="left" valign="top">2 (0.3)</td><td align="left" valign="top">1 (50.0)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">C4.2.3</td><td align="left" valign="top"/><td align="left" valign="top">64 (8.0)</td><td align="left" valign="top">16 (25.0)</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">C4.2.4</td><td align="left" valign="top"/><td align="left" valign="top">2 (0.3)</td><td align="left" valign="top">1 (50.0)</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top" colspan="2"><bold>C4.3</bold></td><td align="left" valign="top"/><td align="left" valign="top">29 (3.6)</td><td align="left" valign="top">3 (10.3)</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">C4.3.1</td><td align="left" valign="top"/><td align="left" valign="top">25 (3.1)</td><td align="left" valign="top">1 (4.0)</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">C4.3.2</td><td align="left" valign="top"/><td align="left" valign="top">2 (0.3)</td><td align="left" valign="top">1 (50.0)</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">C4.3.3</td><td align="left" valign="top"/><td align="left" valign="top">2 (0.3)</td><td align="left" valign="top">1 (50.0)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top" colspan="3"><bold>C5</bold></td><td align="left" valign="top">&#x2713;</td><td align="left" valign="top">74 (9.3)<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td><td align="left" valign="top">31 (41.9)<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top" colspan="2">C5.1</td><td align="left" valign="top">&#x2713;</td><td align="left" valign="top">43 (5.4)</td><td align="left" valign="top">31 (72.1)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top" colspan="2">C5.2</td><td align="left" valign="top"/><td align="left" valign="top">18 (2.3)</td><td align="left" valign="top">14 (77.8)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top" colspan="2">C5.3</td><td align="left" valign="top"/><td align="left" valign="top">34 (4.3)</td><td align="left" valign="top">2 (5.9)</td><td align="left" valign="top">&#x2014;</td></tr></tbody></table><table-wrap-foot><fn id="table5fn1"><p><sup>a</sup>PHN: postherpetic neuralgia.</p></fn><fn id="table5fn2"><p><sup>b</sup>TP: true-positive.</p></fn><fn id="table5fn3"><p><sup>c</sup>PPV: positive predictive value.</p></fn><fn id="table5fn4"><p><sup>d</sup>Supplementary contributions to the number of correctly identified positive cases, apart from method C1.</p></fn><fn id="table5fn5"><p><sup>e</sup>Method C1 only used PHN diagnosis codes.</p></fn><fn id="table5fn6"><p><sup>f</sup>Overall performance.</p></fn><fn id="table5fn7"><p><sup>g</sup>Not applicable.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>We developed and validated NLP algorithms to identify PHN using various clinical data sources from EHRs. Compared with the chart-reviewed reference standard, the NLP algorithms showed high accuracy. This study demonstrates the feasibility of population-based PHN studies using EHR data with an automated method.</p><p>Using manual review to identify PHN cases is often infeasible for population-based research because a large volume of clinical notes would need to be reviewed. In contrast, the size of the study population and length of follow-up have little impact on running the NLP algorithm. Moreover, our NLP algorithm can readily capture PHN at varied time intervals, providing an efficient method to assess the long-term impact of PHN and compare results with studies using different PHN risk windows. Furthermore, studies can use NLP alone or with manual review confirmation. For example, a manual review of the NLP-positive cases (n=61) could increase the specificity and PPV to 100% and improve the F-score from 0.89 to 0.93 and MCC from 0.85 to 0.95; this is more efficient than a manual review of all 800 HZ cases.</p><p>Implementing NLP on EHR data presents challenges. In this study, data sources accounted for one-quarter of NLP errors (2 FNs and 2 FPs). First, clinical data were stored in a variety of locations within our institution&#x2019;s complex EHR system, which contains over 900,000 database tables. It is often difficult to locate the database table storing the data displayed in the EHR user interface. One FN case resulted from not including a previously unknown table. Second, selecting data sources for NLP processing is often a tradeoff. One FN and 2 FP cases resulted from including or excluding certain data sources. EHRs have also made it easy to create lengthy and bloated notes [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. According to recent research, over half of clinical note content is duplicated or copied from earlier notes [<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref34">34</xref>]. Clinicians may copy from prior visit notes to improve recall and clinical reasoning [<xref ref-type="bibr" rid="ref35">35</xref>]. However, these replicated contents may lack temporal or contextual information, making them difficult to identify manually and challenging for NLP.</p><p>Because PHN-related symptoms such as pain and discomfort are common in a variety of medical conditions with numerous plausible causes, identifying PHN necessitates integrating the NLP-identified PHN symptoms with their associated anatomic location, temporality, and causality. These elements, however, are not always explicitly stated in clinical documents. About half of the NLP FP cases were from incorrectly attributing the complaint or treatment to PHN. These FP cases were partially explained by the NLP algorithm&#x2019;s preference for sensitivity over specificity.</p><p>Another popular method of PHN identification is using coded data from administrative claims or EHR, which could include a large sample size at a low cost. However, many of the code-based PHN identification algorithms have not been validated [<xref ref-type="bibr" rid="ref3">3</xref>]. We implemented and validated 5 code-based algorithms, including 1 that solely uses PHN diagnosis codes (C1) and 2 that had previously been validated (C2 and C3). To maximize their sensitivity, algorithms C2-C5 used the &#x201C;OR&#x201D; statement to combine various criteria. The downside of using the &#x201C;OR&#x201D; logic is the loss of PPV. Algorithms C2-C5 all had worse PPV than the diagnosis codes&#x2013;only algorithm (C1). However, in our study, the sensitivity of these algorithms ranged from 53% to 62%, with only C2 outperforming C1 (62% vs 56%). Algorithms C2-C5 had lower PPVs (28%&#x2010;71%) than C1 (72%). With such limited sensitivities, these algorithms may miss roughly half of the PHN cases. In our study, aside from the PHN diagnosis codes, the other diagnosis codes and prescription data had little impact on true case identification, instead adding complexity and increasing FPs.</p><p>Studies have used the similarity of the PHN proportions to construct the validity of their case-finding algorithms [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. Administrative database studies reported PHN (pain persisting for &#x2265;90 days) prevalences of 3%&#x2010;14% (<xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>) [<xref ref-type="bibr" rid="ref3">3</xref>], which are comparable to the 5.4%&#x2010;13.1% prevalences of the code-based approaches in our study. The broad range of prevalences identified in previous code-based studies could be caused by variations in study design, population, and data source [<xref ref-type="bibr" rid="ref3">3</xref>]. However, the code-based approaches in this study had the same population and data source. Only the variation in algorithms could cause such a wide disparity.</p><p>We expanded the validations conducted for the 2 previously validated algorithms, which were performed on EHR data. The C2 (Klompas et al [<xref ref-type="bibr" rid="ref8">8</xref>]) algorithm was only validated with the 30-day definition in the original study, and it had 86% sensitivity and 78% PPV. In our study, algorithm C2 with the 90-day definition had notably lower sensitivity (62%) and PPV (39%). One main contributor to the variability in performance is the difference in the temporal criteria. According to Yawn [<xref ref-type="bibr" rid="ref36">36</xref>], up to 75% of pain present at 30 days disappears at 90 days, and the prevalence of PHN decreased by sixfold when the definition was changed from 30 days to 90 days. As prevalence decreases, so do the sensitivity and PPV [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. The same trends were also reported in the original C2 paper; the PPVs for different PHN search criteria using the 30-day definition (29%&#x2010;95%) were nearly double that of using the 90-day definition (15%&#x2010;52%). The discrepancy in C2 algorithm performance between the original study and this study could be further explained by the differences in case definition. Our case definition for PHN is based on persistent PHN-related symptoms and causal attribution, not diagnosis code or medication. Algorithm C2 used ongoing symptoms or renewal of medication for HZ. The use of medications to identify PHN has some drawbacks, as PHN-related medications have a wide range of indications. For example, gabapentin, a first-line therapy for PHN, has over 20 approved and off-label uses [<xref ref-type="bibr" rid="ref39">39</xref>]. Furthermore, prescriptions can be refilled in the absence of active PHN symptoms for various non-PHN disorders.</p><p>The original C3 (Klein et al [<xref ref-type="bibr" rid="ref10">10</xref>]) algorithm was only validated on potential PHN cases identified by its 4 component criteria, rather than randomly selected HZ cases; only PPVs were reported. In this study, the 4 criteria of the C3 algorithm had PPVs ranging from 71% to 100%, which is consistent with the previous study&#x2019;s findings (PPVs ranging from 73% to 96%). The C3 algorithm was one of the best-performing code-based algorithms based on F-score and MCC. However, its low sensitivity (56%) and PPV (71%) indicate considerable misclassification. The lower overall PPV is partly due to the &#x201C;OR&#x201D; logic of the 4 criteria. Because Klein et al [<xref ref-type="bibr" rid="ref10">10</xref>] did not describe the case definition or chart review rules, we were unable to assess their impact on the performance differences between the original C3 study and this study.</p><p>The substantial misclassification of coded methods as observed in this study could have a substantial impact on measuring incidence, identifying risk factors, and assessing vaccine effectiveness. Code-based method studies (C4 and C5) had identified depression, diabetes mellitus, heart failure, and chronic obstructive pulmonary disease as risk factors for PHN. It is conceivable that the link between depression and PHN is caused by using anticonvulsants and tricyclic antidepressants to identify PHN. The inclusion of prescriptions for pain medications and chronic pain codes may contribute to the association of diabetes mellitus [<xref ref-type="bibr" rid="ref40">40</xref>], heart failure [<xref ref-type="bibr" rid="ref41">41</xref>], and chronic obstructive pulmonary disease [<xref ref-type="bibr" rid="ref42">42</xref>] with PHN.</p></sec><sec id="s4-2"><title>Study Strengths and Limitations</title><p>This study was conducted within a large integrated health care system with comprehensive EHRs. Because the health plan provides strong incentives for members to use its facilities, clinical documentation is expected to be more detailed. We developed NLP algorithms to identify PHN from various unstructured data sources within EHRs, such as clinical notes, which contain a wealth of information but differ greatly in structure, content, and quality. The algorithms were highly accurate, as evidenced by our validation. Compared with studies based on self-reported pain scores collected through surveys, EHR-based studies measure the health care burden of PHN, which is more clinically relevant. This study also has limitations. The reference standard relied on the review of EHRs which could be erroneous and incomplete [<xref ref-type="bibr" rid="ref14">14</xref>]. Moreover, rereviewing cases in the validation set where NLP results differed from research associates&#x2019; results may result in bias in favor of higher performance of the NLP algorithm. On the other hand, reconciling discrepant results improved the quality of the reference standard. Additionally, diagnosis codes, prescriptions, clinical documentation language, and style can differ between institutions and physicians. Our NLP method may perform differently in other test data sets.</p></sec><sec id="s4-3"><title>Conclusions</title><p>PHN-related diagnosis codes have low sensitivity for identifying PHN cases. Additional diagnosis codes and prescription data did little to improve sensitivity while significantly lowering the PPV. Using clinical text from the EHR, the NLP-based method identified PHN cases with high accuracy. Our NLP method can be used in EHR-based studies to identify PHN risk factors and evaluate the effectiveness of vaccinations and treatments against PHN.</p></sec></sec></body><back><ack><p>A part of this work was previously presented at IDWeek 2023, which was held in Boston, Massachusetts on October 12, 2023. This work was supported by Kaiser Permanente Southern California internal research funds.</p></ack><fn-group><fn fn-type="conflict"><p>HFT received research funding from GSK for a shingles vaccine&#x2013;related study. He also received funding from Moderna for studies unrelated to this publication.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">EHR</term><def><p>electronic health record</p></def></def-item><def-item><term id="abb2">FN</term><def><p>false-negative</p></def></def-item><def-item><term id="abb3">FP</term><def><p>false-positive</p></def></def-item><def-item><term id="abb4">HZ</term><def><p>herpes zoster</p></def></def-item><def-item><term id="abb5">KPSC</term><def><p>Kaiser Permanente Southern California</p></def></def-item><def-item><term id="abb6">MCC</term><def><p>Matthews correlation coefficient</p></def></def-item><def-item><term id="abb7">NLP</term><def><p>natural language processing</p></def></def-item><def-item><term id="abb8">NPV</term><def><p>negative predictive value</p></def></def-item><def-item><term id="abb9">PHN</term><def><p>postherpetic neuralgia</p></def></def-item><def-item><term id="abb10">PPV</term><def><p>positive predictive value</p></def></def-item><def-item><term id="abb11">TN</term><def><p>true-negative</p></def></def-item><def-item><term id="abb12">TP</term><def><p>true-positive</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gershon</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Breuer</surname><given-names>J</given-names> </name><name name-style="western"><surname>Cohen</surname><given-names>JI</given-names> </name><etal/></person-group><article-title>Varicella zoster virus infection</article-title><source>Nat Rev Dis Primers</source><year>2015</year><month>07</month><day>2</day><volume>1</volume><fpage>15016</fpage><pub-id pub-id-type="doi">10.1038/nrdp.2015.16</pub-id><pub-id pub-id-type="medline">27188665</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gnann</surname><given-names>JW</given-names> </name><name name-style="western"><surname>Whitley</surname><given-names>RJ</given-names> </name></person-group><article-title>Clinical practice. herpes zoster</article-title><source>N Engl J Med</source><year>2002</year><month>08</month><day>1</day><volume>347</volume><issue>5</issue><fpage>340</fpage><lpage>346</lpage><pub-id pub-id-type="doi">10.1056/NEJMcp013211</pub-id><pub-id pub-id-type="medline">12151472</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kawai</surname><given-names>K</given-names> </name><name name-style="western"><surname>Gebremeskel</surname><given-names>BG</given-names> </name><name name-style="western"><surname>Acosta</surname><given-names>CJ</given-names> </name></person-group><article-title>Systematic review of incidence and complications of herpes zoster: towards a global perspective</article-title><source>BMJ Open</source><year>2014</year><month>06</month><day>10</day><volume>4</volume><issue>6</issue><fpage>e004833</fpage><pub-id pub-id-type="doi">10.1136/bmjopen-2014-004833</pub-id><pub-id pub-id-type="medline">24916088</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Johnson</surname><given-names>RW</given-names> </name><name name-style="western"><surname>Alvarez-Pasquin</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Bijl</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Herpes zoster epidemiology, management, and disease and economic burden in Europe: a multidisciplinary perspective</article-title><source>Ther Adv Vaccines</source><year>2015</year><month>07</month><volume>3</volume><issue>4</issue><fpage>109</fpage><lpage>120</lpage><pub-id pub-id-type="doi">10.1177/2051013615599151</pub-id><pub-id pub-id-type="medline">26478818</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Johnson</surname><given-names>RW</given-names> </name><name name-style="western"><surname>Rice</surname><given-names>ASC</given-names> </name></person-group><article-title>Postherpetic neuralgia</article-title><source>N Engl J Med</source><year>2014</year><month>10</month><day>16</day><volume>371</volume><issue>16</issue><fpage>1526</fpage><lpage>1533</lpage><pub-id pub-id-type="doi">10.1056/NEJMcp1403062</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rowbotham</surname><given-names>M</given-names> </name><name name-style="western"><surname>Harden</surname><given-names>N</given-names> </name><name name-style="western"><surname>Stacey</surname><given-names>B</given-names> </name><name name-style="western"><surname>Bernstein</surname><given-names>P</given-names> </name><name name-style="western"><surname>Magnus-Miller</surname><given-names>L</given-names> </name></person-group><article-title>Gabapentin for the treatment of postherpetic neuralgia: a randomized controlled trial</article-title><source>JAMA</source><year>1998</year><month>12</month><day>2</day><volume>280</volume><issue>21</issue><fpage>1837</fpage><lpage>1842</lpage><pub-id pub-id-type="doi">10.1001/jama.280.21.1837</pub-id><pub-id pub-id-type="medline">9846778</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lal</surname><given-names>H</given-names> </name><name name-style="western"><surname>Cunningham</surname><given-names>AL</given-names> </name><name name-style="western"><surname>Godeaux</surname><given-names>O</given-names> </name><etal/></person-group><article-title>Efficacy of an adjuvanted herpes zoster subunit vaccine in older adults</article-title><source>N Engl J Med</source><year>2015</year><month>05</month><day>28</day><volume>372</volume><issue>22</issue><fpage>2087</fpage><lpage>2096</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa1501184</pub-id><pub-id pub-id-type="medline">25916341</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Klompas</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kulldorff</surname><given-names>M</given-names> </name><name name-style="western"><surname>Vilk</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Bialek</surname><given-names>SR</given-names> </name><name name-style="western"><surname>Harpaz</surname><given-names>R</given-names> </name></person-group><article-title>Herpes zoster and postherpetic neuralgia surveillance using structured electronic data</article-title><source>Mayo Clin Proc</source><year>2011</year><month>12</month><volume>86</volume><issue>12</issue><fpage>1146</fpage><lpage>1153</lpage><pub-id pub-id-type="doi">10.4065/mcp.2011.0305</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Forbes</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>Bhaskaran</surname><given-names>K</given-names> </name><name name-style="western"><surname>Thomas</surname><given-names>SL</given-names> </name><etal/></person-group><article-title>Quantification of risk factors for postherpetic neuralgia in herpes zoster patients: a cohort study</article-title><source>Neurology (ECronicon)</source><year>2016</year><month>07</month><day>5</day><volume>87</volume><issue>1</issue><fpage>94</fpage><lpage>102</lpage><pub-id pub-id-type="doi">10.1212/WNL.0000000000002808</pub-id><pub-id pub-id-type="medline">27287218</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Klein</surname><given-names>NP</given-names> </name><name name-style="western"><surname>Bartlett</surname><given-names>J</given-names> </name><name name-style="western"><surname>Fireman</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Long-term effectiveness of zoster vaccine live for postherpetic neuralgia prevention</article-title><source>Vaccine (Auckl)</source><year>2019</year><month>08</month><day>23</day><volume>37</volume><issue>36</issue><fpage>5422</fpage><lpage>5427</lpage><pub-id pub-id-type="doi">10.1016/j.vaccine.2019.07.004</pub-id><pub-id pub-id-type="medline">31301920</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mu&#x00F1;oz-Quiles</surname><given-names>C</given-names> </name><name name-style="western"><surname>L&#x00F3;pez-Lacort</surname><given-names>M</given-names> </name><name name-style="western"><surname>Orrico-S&#x00E1;nchez</surname><given-names>A</given-names> </name><name name-style="western"><surname>D&#x00ED;ez-Domingo</surname><given-names>J</given-names> </name></person-group><article-title>Impact of postherpetic neuralgia: a six year population-based analysis on people aged 50 years or older</article-title><source>J Infect</source><year>2018</year><month>08</month><volume>77</volume><issue>2</issue><fpage>131</fpage><lpage>136</lpage><pub-id pub-id-type="doi">10.1016/j.jinf.2018.04.004</pub-id><pub-id pub-id-type="medline">29742472</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Suaya</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>SY</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Burstin</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Levin</surname><given-names>MJ</given-names> </name></person-group><article-title>Incidence of herpes zoster and persistent post-zoster pain in adults with or without diabetes in the United States</article-title><source>Open Forum Infect Dis</source><year>2014</year><month>09</month><volume>1</volume><issue>2</issue><fpage>ofu049</fpage><pub-id pub-id-type="doi">10.1093/ofid/ofu049</pub-id><pub-id pub-id-type="medline">25734121</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hillebrand</surname><given-names>K</given-names> </name><name name-style="western"><surname>Bricout</surname><given-names>H</given-names> </name><name name-style="western"><surname>Schulze-Rath</surname><given-names>R</given-names> </name><name name-style="western"><surname>Schink</surname><given-names>T</given-names> </name><name name-style="western"><surname>Garbe</surname><given-names>E</given-names> </name></person-group><article-title>Incidence of herpes zoster and its complications in Germany, 2005-2009</article-title><source>J Infect</source><year>2015</year><month>02</month><volume>70</volume><issue>2</issue><fpage>178</fpage><lpage>186</lpage><pub-id pub-id-type="doi">10.1016/j.jinf.2014.08.018</pub-id><pub-id pub-id-type="medline">25230396</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yawn</surname><given-names>BP</given-names> </name><name name-style="western"><surname>Wollan</surname><given-names>P</given-names> </name><name name-style="western"><surname>St Sauver</surname><given-names>J</given-names> </name></person-group><article-title>Comparing shingles incidence and complication rates from medical record review and administrative database estimates: how close are they?</article-title><source>Am J Epidemiol</source><year>2011</year><month>11</month><day>1</day><volume>174</volume><issue>9</issue><fpage>1054</fpage><lpage>1061</lpage><pub-id pub-id-type="doi">10.1093/aje/kwr206</pub-id><pub-id pub-id-type="medline">21920944</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tanenbaum</surname><given-names>HC</given-names> </name><name name-style="western"><surname>Lawless</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sy</surname><given-names>LS</given-names> </name><etal/></person-group><article-title>Differences in estimates of post-herpetic neuralgia between medical chart review and self-report</article-title><source>J Pain Res</source><year>2020</year><volume>13</volume><fpage>1757</fpage><lpage>1762</lpage><pub-id pub-id-type="doi">10.2147/JPR.S255238</pub-id><pub-id pub-id-type="medline">32765050</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tseng</surname><given-names>HF</given-names> </name><name name-style="western"><surname>Lewin</surname><given-names>B</given-names> </name><name name-style="western"><surname>Hales</surname><given-names>CM</given-names> </name><etal/></person-group><article-title>Zoster vaccine and the risk of postherpetic neuralgia in patients who developed herpes zoster despite having received the zoster vaccine</article-title><source>J Infect Dis</source><year>2015</year><month>10</month><day>15</day><volume>212</volume><issue>8</issue><fpage>1222</fpage><lpage>1231</lpage><pub-id pub-id-type="doi">10.1093/infdis/jiv244</pub-id><pub-id pub-id-type="medline">26038400</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Luo</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Mercado</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Using natural language processing for identification of herpes zoster ophthalmicus cases to support population-based study</article-title><source>Clin Exp Ophthalmol</source><year>2019</year><month>01</month><volume>47</volume><issue>1</issue><fpage>7</fpage><lpage>14</lpage><pub-id pub-id-type="doi">10.1111/ceo.13340</pub-id><pub-id pub-id-type="medline">29920898</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Sy</surname><given-names>LS</given-names> </name><name name-style="western"><surname>Tanenbaum</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Text-based identification of herpes zoster ophthalmicus with ocular involvement in the electronic health record: a population-based study</article-title><source>Open Forum Infect Dis</source><year>2021</year><month>02</month><volume>8</volume><issue>2</issue><fpage>ofaa652</fpage><pub-id pub-id-type="doi">10.1093/ofid/ofaa652</pub-id><pub-id pub-id-type="medline">33575426</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Delaney</surname><given-names>A</given-names> </name><name name-style="western"><surname>Colvin</surname><given-names>LA</given-names> </name><name name-style="western"><surname>Fallon</surname><given-names>MT</given-names> </name><name name-style="western"><surname>Dalziel</surname><given-names>RG</given-names> </name><name name-style="western"><surname>Mitchell</surname><given-names>R</given-names> </name><name name-style="western"><surname>Fleetwood-Walker</surname><given-names>SM</given-names> </name></person-group><article-title>Postherpetic neuralgia: from preclinical models to the clinic</article-title><source>Neurotherapeutics</source><year>2009</year><month>10</month><volume>6</volume><issue>4</issue><fpage>630</fpage><lpage>637</lpage><pub-id pub-id-type="doi">10.1016/j.nurt.2009.07.005</pub-id><pub-id pub-id-type="medline">19789068</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Forbes</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>Thomas</surname><given-names>SL</given-names> </name><name name-style="western"><surname>Smeeth</surname><given-names>L</given-names> </name><etal/></person-group><article-title>A systematic review and meta-analysis of risk factors for postherpetic neuralgia</article-title><source>Pain</source><year>2016</year><month>01</month><volume>157</volume><issue>1</issue><fpage>30</fpage><lpage>54</lpage><pub-id pub-id-type="doi">10.1097/j.pain.0000000000000307</pub-id><pub-id pub-id-type="medline">26218719</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Coplan</surname><given-names>PM</given-names> </name><name name-style="western"><surname>Schmader</surname><given-names>K</given-names> </name><name name-style="western"><surname>Nikas</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Development of a measure of the burden of pain due to herpes zoster and postherpetic neuralgia for prevention trials: adaptation of the brief pain inventory</article-title><source>J Pain</source><year>2004</year><month>08</month><volume>5</volume><issue>6</issue><fpage>344</fpage><lpage>356</lpage><pub-id pub-id-type="doi">10.1016/j.jpain.2004.06.001</pub-id><pub-id pub-id-type="medline">15336639</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Rashid</surname><given-names>N</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>YL</given-names> </name><etal/></person-group><article-title>Using natural language processing and machine learning to identify gout flares from electronic clinical notes</article-title><source>Arthritis Care Res (Hoboken)</source><year>2014</year><month>11</month><volume>66</volume><issue>11</issue><fpage>1740</fpage><lpage>1748</lpage><pub-id pub-id-type="doi">10.1002/acr.22324</pub-id><pub-id pub-id-type="medline">24664671</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>BC</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>YL</given-names> </name><etal/></person-group><article-title>Automated identification and extraction of exercise treadmill test results</article-title><source>J Am Heart Assoc</source><year>2020</year><month>03</month><day>3</day><volume>9</volume><issue>5</issue><fpage>e014940</fpage><pub-id pub-id-type="doi">10.1161/JAHA.119.014940</pub-id><pub-id pub-id-type="medline">32079480</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Xie</surname><given-names>F</given-names> </name><etal/></person-group><article-title>The use of natural language processing to identify Tdap-related local reactions at five health care systems in the Vaccine Safety Datalink</article-title><source>Int J Med Inform</source><year>2019</year><month>07</month><volume>127</volume><fpage>27</fpage><lpage>34</lpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2019.04.009</pub-id><pub-id pub-id-type="medline">31128829</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Duffy</surname><given-names>J</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>ILA</given-names> </name><etal/></person-group><article-title>Identifying cases of shoulder injury related to vaccine administration (SIRVA) in the United States: development and validation of a natural language processing method</article-title><source>JMIR Public Health Surveill</source><year>2022</year><month>05</month><day>24</day><volume>8</volume><issue>5</issue><fpage>e30426</fpage><pub-id pub-id-type="doi">10.2196/30426</pub-id><pub-id pub-id-type="medline">35608886</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Rashid</surname><given-names>N</given-names> </name><name name-style="western"><surname>Koblick</surname><given-names>R</given-names> </name><name name-style="western"><surname>An</surname><given-names>J</given-names> </name></person-group><article-title>Medication extraction from electronic clinical notes in an integrated health system: a study on aspirin use in patients with nonvalvular atrial fibrillation</article-title><source>Clin Ther</source><year>2015</year><month>09</month><volume>37</volume><issue>9</issue><fpage>2048</fpage><lpage>2058</lpage><pub-id pub-id-type="doi">10.1016/j.clinthera.2015.07.002</pub-id><pub-id pub-id-type="medline">26233471</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yanni</surname><given-names>EA</given-names> </name><name name-style="western"><surname>Ferreira</surname><given-names>G</given-names> </name><name name-style="western"><surname>Guennec</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Burden of herpes zoster in 16 selected immunocompromised populations in England: a cohort study in the Clinical Practice Research Datalink 2000-2012</article-title><source>BMJ Open</source><year>2018</year><month>06</month><day>7</day><volume>8</volume><issue>6</issue><fpage>e020528</fpage><pub-id pub-id-type="doi">10.1136/bmjopen-2017-020528</pub-id><pub-id pub-id-type="medline">29880565</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Derczynski</surname><given-names>L</given-names> </name></person-group><article-title>Complementarity, F-score, and NLP evaluation</article-title><conf-name>Tenth International Conference on Language Resources and Evaluation (LREC&#x2019;16)</conf-name><conf-date>May 23-28, 2016</conf-date><conf-loc>Portoro&#x017E;, Slovenia</conf-loc></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chicco</surname><given-names>D</given-names> </name><name name-style="western"><surname>Jurman</surname><given-names>G</given-names> </name></person-group><article-title>The advantages of the Matthews correlation coefficient (MCC) over F1 score and accuracy in binary classification evaluation</article-title><source>BMC Genomics</source><year>2020</year><month>01</month><day>2</day><volume>21</volume><issue>1</issue><fpage>6</fpage><pub-id pub-id-type="doi">10.1186/s12864-019-6413-7</pub-id><pub-id pub-id-type="medline">31898477</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chicco</surname><given-names>D</given-names> </name><name name-style="western"><surname>Jurman</surname><given-names>G</given-names> </name></person-group><article-title>The Matthews correlation coefficient (MCC) should replace the ROC AUC as the standard metric for assessing binary classification</article-title><source>BioData Min</source><year>2023</year><month>02</month><day>17</day><volume>16</volume><issue>1</issue><fpage>4</fpage><pub-id pub-id-type="doi">10.1186/s13040-023-00322-4</pub-id><pub-id pub-id-type="medline">36800973</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Downing</surname><given-names>NL</given-names> </name><name name-style="western"><surname>Bates</surname><given-names>DW</given-names> </name><name name-style="western"><surname>Longhurst</surname><given-names>CA</given-names> </name></person-group><article-title>Physician burnout in the electronic health record era: are we ignoring the real cause?</article-title><source>Ann Intern Med</source><year>2018</year><month>07</month><day>3</day><volume>169</volume><issue>1</issue><fpage>50</fpage><lpage>51</lpage><pub-id pub-id-type="doi">10.7326/M18-0139</pub-id><pub-id pub-id-type="medline">29801050</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rule</surname><given-names>A</given-names> </name><name name-style="western"><surname>Bedrick</surname><given-names>S</given-names> </name><name name-style="western"><surname>Chiang</surname><given-names>MF</given-names> </name><name name-style="western"><surname>Hribar</surname><given-names>MR</given-names> </name></person-group><article-title>Length and redundancy of outpatient progress notes across a decade at an academic medical center</article-title><source>JAMA Netw Open</source><year>2021</year><month>07</month><day>1</day><volume>4</volume><issue>7</issue><fpage>e2115334</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2021.15334</pub-id><pub-id pub-id-type="medline">34279650</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Steinkamp</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kantrowitz</surname><given-names>JJ</given-names> </name><name name-style="western"><surname>Airan-Javia</surname><given-names>S</given-names> </name></person-group><article-title>Prevalence and sources of duplicate information in the electronic medical record</article-title><source>JAMA Netw Open</source><year>2022</year><month>09</month><day>1</day><volume>5</volume><issue>9</issue><fpage>e2233348</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2022.33348</pub-id><pub-id pub-id-type="medline">36156143</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>MD</given-names> </name><name name-style="western"><surname>Khanna</surname><given-names>R</given-names> </name><name name-style="western"><surname>Najafi</surname><given-names>N</given-names> </name></person-group><article-title>Characterizing the source of text in electronic health record progress notes</article-title><source>JAMA Intern Med</source><year>2017</year><month>08</month><day>1</day><volume>177</volume><issue>8</issue><fpage>1212</fpage><lpage>1213</lpage><pub-id pub-id-type="doi">10.1001/jamainternmed.2017.1548</pub-id><pub-id pub-id-type="medline">28558106</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Bansal</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Identification of recurrent atrial fibrillation using natural language processing applied to electronic health records</article-title><source>Eur Heart J Qual Care Clin Outcomes</source><year>2024</year><month>01</month><day>12</day><volume>10</volume><issue>1</issue><fpage>77</fpage><lpage>88</lpage><pub-id pub-id-type="doi">10.1093/ehjqcco/qcad021</pub-id><pub-id pub-id-type="medline">36997334</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yawn</surname><given-names>BP</given-names> </name></person-group><article-title>Post-shingles neuralgia by any definition is painful, but is it PHN?</article-title><source>Mayo Clin Proc</source><year>2011</year><month>12</month><volume>86</volume><issue>12</issue><fpage>1141</fpage><lpage>1142</lpage><pub-id pub-id-type="doi">10.4065/mcp.2011.0724</pub-id><pub-id pub-id-type="medline">22134931</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Murad</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>L</given-names> </name><name name-style="western"><surname>Chu</surname><given-names>H</given-names> </name><etal/></person-group><article-title>The association of sensitivity and specificity with disease prevalence: analysis of 6909 studies of diagnostic test accuracy</article-title><source>CMAJ</source><year>2023</year><month>07</month><day>17</day><volume>195</volume><issue>27</issue><fpage>E925</fpage><lpage>E931</lpage><pub-id pub-id-type="doi">10.1503/cmaj.221802</pub-id><pub-id pub-id-type="medline">37460126</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Tenny</surname><given-names>S</given-names> </name><name name-style="western"><surname>Hoffman</surname><given-names>MR</given-names> </name></person-group><article-title>Prevalence</article-title><source>StatPearls [Internet]</source><year>2023</year><access-date>2024-09-04</access-date><publisher-name>StatPearls Publishing</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/books/NBK430867/">https://www.ncbi.nlm.nih.gov/books/NBK430867/</ext-link></comment></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Yasaei</surname><given-names>R</given-names> </name><name name-style="western"><surname>Katta</surname><given-names>S</given-names> </name><name name-style="western"><surname>Patel</surname><given-names>P</given-names> </name><name name-style="western"><surname>Saadabadi</surname><given-names>A</given-names> </name></person-group><article-title>Gabapentin</article-title><source>StatPearls [Internet]</source><year>2024</year><access-date>2024-09-04</access-date><publisher-name>StatPearls Publishing</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/books/NBK493228/">https://www.ncbi.nlm.nih.gov/books/NBK493228/</ext-link></comment></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dyck</surname><given-names>PJ</given-names> </name><name name-style="western"><surname>Kratz</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Karnes</surname><given-names>JL</given-names> </name><etal/></person-group><article-title>The prevalence by staged severity of various types of diabetic neuropathy, retinopathy, and nephropathy in a population-based cohort: the Rochester Diabetic Neuropathy Study</article-title><source>Neurology (ECronicon)</source><year>1993</year><month>04</month><volume>43</volume><issue>4</issue><fpage>817</fpage><lpage>824</lpage><pub-id pub-id-type="doi">10.1212/wnl.43.4.817</pub-id><pub-id pub-id-type="medline">8469345</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alemzadeh-Ansari</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Ansari-Ramandi</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Naderi</surname><given-names>N</given-names> </name></person-group><article-title>Chronic pain in chronic heart failure: a review article</article-title><source>J Tehran Heart Cent</source><year>2017</year><month>04</month><volume>12</volume><issue>2</issue><fpage>49</fpage><lpage>56</lpage><pub-id pub-id-type="medline">28828019</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Anden&#x00E6;s</surname><given-names>R</given-names> </name><name name-style="western"><surname>Momyr</surname><given-names>A</given-names> </name><name name-style="western"><surname>Brekke</surname><given-names>I</given-names> </name></person-group><article-title>Reporting of pain by people with chronic obstructive pulmonary disease (COPD): comparative results from the HUNT3 population-based survey</article-title><source>BMC Public Health</source><year>2018</year><month>01</month><day>25</day><volume>18</volume><issue>1</issue><fpage>181</fpage><pub-id pub-id-type="doi">10.1186/s12889-018-5094-5</pub-id><pub-id pub-id-type="medline">29370850</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Postherpetic neuralgia abstraction decision rules.</p><media xlink:href="medinform_v12i1e57949_app1.docx" xlink:title="DOCX File, 30 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Additional details on natural language processing algorithm development.</p><media xlink:href="medinform_v12i1e57949_app2.docx" xlink:title="DOCX File, 30 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Code-based methods.</p><media xlink:href="medinform_v12i1e57949_app3.docx" xlink:title="DOCX File, 38 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>The proportion of herpes zoster&#x2013; or postherpetic neuralgia&#x2013;related notes by department/specialty.</p><media xlink:href="medinform_v12i1e57949_app4.docx" xlink:title="DOCX File, 81 KB"/></supplementary-material><supplementary-material id="app5"><label>Multimedia Appendix 5</label><p>Number and percentage of herpes zoster locations as identified by natural language processing.</p><media xlink:href="medinform_v12i1e57949_app5.docx" xlink:title="DOCX File, 32 KB"/></supplementary-material><supplementary-material id="app6"><label>Multimedia Appendix 6</label><p>Reported postherpetic neuralgia rates in previous administrative database studies.</p><media xlink:href="medinform_v12i1e57949_app6.docx" xlink:title="DOCX File, 32 KB"/></supplementary-material></app-group></back></article>