<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i11e29768</article-id>
      <article-id pub-id-type="pmid">34847064</article-id>
      <article-id pub-id-type="doi">10.2196/29768</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A Pipeline to Understand Emerging Illness Via Social Media Data Analysis: Case Study on Breast Implant Illness</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Lovis</surname>
            <given-names>Christian</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Chen</surname>
            <given-names>Anfan</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Foufi</surname>
            <given-names>Vasiliki</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Wakamiya</surname>
            <given-names>Shoko</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Timakum</surname>
            <given-names>Tatsawan</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Dey</surname>
            <given-names>Vishal</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7832-0915</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Krasniak</surname>
            <given-names>Peter</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6490-2025</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Nguyen</surname>
            <given-names>Minh</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1487-1152</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>Clara</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0514-9448</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Ning</surname>
            <given-names>Xia</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Department of Biomedical Informatics</institution>
            <institution>The Ohio State University</institution>
            <addr-line>1800 Cannon Drive</addr-line>
            <addr-line>Columbus, OH, 43210</addr-line>
            <country>United States</country>
            <phone>1 6143662287</phone>
            <email>ning.104@osu.edu</email>
          </address>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6842-1165</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Computer Science and Engineering</institution>
        <institution>The Ohio State University</institution>
        <addr-line>Columbus, OH</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Biomedical Informatics</institution>
        <institution>The Ohio State University</institution>
        <addr-line>Columbus, OH</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Translational Data Analytics Institute</institution>
        <institution>The Ohio State University</institution>
        <addr-line>Columbus, OH</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Xia Ning <email>ning.104@osu.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>11</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>29</day>
        <month>11</month>
        <year>2021</year>
      </pub-date>
      <volume>9</volume>
      <issue>11</issue>
      <elocation-id>e29768</elocation-id>
      <history>
        <date date-type="received">
          <day>19</day>
          <month>4</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>5</day>
          <month>6</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>31</day>
          <month>7</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>23</day>
          <month>9</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Vishal Dey, Peter Krasniak, Minh Nguyen, Clara Lee, Xia Ning. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 29.11.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2021/11/e29768" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>A new illness can come to public attention through social media before it is medically defined, formally documented, or systematically studied. One example is a condition known as breast implant illness (BII), which has been extensively discussed on social media, although it is vaguely defined in the medical literature.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The objective of this study is to construct a data analysis pipeline to understand emerging illnesses using social media data and to apply the pipeline to understand the key attributes of BII.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We constructed a pipeline of social media data analysis using natural language processing and topic modeling. Mentions related to signs, symptoms, diseases, disorders, and medical procedures were extracted from social media data using the clinical Text Analysis and Knowledge Extraction System. We mapped the mentions to standard medical concepts and then summarized these mapped concepts as topics using latent Dirichlet allocation. Finally, we applied this pipeline to understand BII from several BII-dedicated social media sites.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Our pipeline identified topics related to toxicity, cancer, and mental health issues that were highly associated with BII. Our pipeline also showed that cancers, autoimmune disorders, and mental health problems were emerging concerns associated with breast implants, based on social media discussions. Furthermore, the pipeline identified mentions such as rupture, infection, pain, and fatigue as common self-reported issues among the public, as well as concerns about toxicity from silicone implants.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our study could inspire future studies on the suggested symptoms and factors of BII. Our study provides the first analysis and derived knowledge of BII from social media using natural language processing techniques and demonstrates the potential of using social media information to better understand similar emerging illnesses.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>breast implant illness</kwd>
        <kwd>social media</kwd>
        <kwd>natural language processing</kwd>
        <kwd>topic modeling</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>The ubiquity of social media has resulted in early descriptions of new and evolving diseases on social media platforms before they can be systematically studied [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref7">7</xref>], particularly during the era of the medical internet [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]. Social media users increasingly turn to platforms such as Twitter (Twitter Inc), Facebook (Facebook Inc), and YouTube (Google LLC) to share personal experiences, including diseases and illnesses they have experienced, or to seek support and resources, such as health and medical resources. Recent studies have shown the potential of social media in the detection of mental illness and depression [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref17">17</xref>] and in the early detection of food-borne illnesses [<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref20">20</xref>] and other infectious diseases [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref24">24</xref>]. Furthermore, several studies have demonstrated social media as an effective tool to disseminate information regarding symptoms, personal well-being, and public health resources during multiple influenza outbreaks [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref28">28</xref>]. During the early stages of COVID-19, studies [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>] analyzed posts on Sina Weibo (Weibo Corporation)—a major Chinese microblogging site—to characterize patient symptoms and public concerns in multiple provinces of China. 
From the analysis of Weibo (Weibo Corporation) posts, Huang et al [<xref ref-type="bibr" rid="ref30">30</xref>] concluded that most of the affected patients were older persons, with fever as the most common symptom. These studies demonstrate that public social media data can be leveraged to better understand emerging illnesses and to accommodate prompt responses.</p>
        <p>One new illness we studied in this manuscript was breast implant illness (BII). Breast implants have gained popularity over the last 20 years [<xref ref-type="bibr" rid="ref31">31</xref>]. During this period, more than 400,000 women have undergone breast augmentation or postmastectomy surgeries every year in the United States [<xref ref-type="bibr" rid="ref32">32</xref>]. There was a 4% increase in the number of breast augmentation procedures between 2017 and 2018, and a 6% increase in breast implant removal procedures occurred over the same period [<xref ref-type="bibr" rid="ref32">32</xref>]. Concerns about the safety of breast implants have also arisen [<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref38">38</xref>] and persisted [<xref ref-type="bibr" rid="ref39">39</xref>-<xref ref-type="bibr" rid="ref45">45</xref>]. However, although a causal link between breast implants and systemic diseases has not been definitively shown, a phenomenon called <italic>breast implant illness</italic>, which attributes systemic symptoms to breast implants, has emerged [<xref ref-type="bibr" rid="ref46">46</xref>]. Unlike other new medical illnesses, however, BII has been reported minimally in the medical literature, being primarily limited to social media [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref47">47</xref>-<xref ref-type="bibr" rid="ref50">50</xref>]. For example, a recent analysis [<xref ref-type="bibr" rid="ref49">49</xref>] demonstrated increasing public interest in BII based on Twitter and Google Trends data from February 2018 to February 2019. To summarize the key symptoms, diseases, and disorders defining BII, several cohort studies [<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref52">52</xref>] have analyzed patient-reported outcomes before and after breast explant surgeries. 
These studies showed some potential relationships between explant surgeries and the improvement of specific symptoms in the patient population. Unfortunately, these studies were not definitive because of their limited study design secondary to their lack of control groups, data collection bias, and lack of randomization. The lack of medical knowledge about BII makes it difficult to define the condition, and therefore, it is nearly impossible to conduct rigorous epidemiological or clinical studies. BII is just one disease process for which the lack of medical knowledge is apparent, but there are many other new illnesses for which this is the case. Any initial knowledge that is supported by sufficient social media data would be meaningful as a reference for formal studies in the future, and thus, techniques to discover such knowledge are much needed.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>To identify and summarize the key attributes of a new illness, in this study, we constructed a data analysis pipeline for the social media data analysis of BII. The pipeline incorporated natural language processing (NLP) and topic modeling methods. Our primary objective is to derive novel knowledge about BII, a medical condition that has not yet been systematically studied and defined in the medical literature, by constructing a data analysis pipeline and applying the pipeline to social media data. As medical knowledge and literature on BII have not been established and the related concepts are not well defined or accepted, using social media data to understand emerging issues could be a meaningful starting point. We applied this pipeline to better understand the symptoms and signs associated with BII. To the best of our knowledge, this study is the first to derive knowledge of BII from social media data. This demonstrates the potential of using social media information to better understand the conditions that have primarily been reported on social media. It also establishes the effectiveness of our pipeline and its potential application to understand other new illnesses. In the following discussion, we have described our analysis pipeline in the context of BII. However, our pipeline is not specific to BII and is applicable to other illnesses as well.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data</title>
        <p>We collected and used data from select social media websites. These websites were selected because they were dedicated to BII discussions and information and were focused on user groups with interest in BII. Often, dedicated social media websites (eg, forums and Twitter pages) are available for a particular illness or disease. For example, some dedicated websites [<xref ref-type="bibr" rid="ref53">53</xref>-<xref ref-type="bibr" rid="ref55">55</xref>] contain the stories and experiences of patients fighting different cancers, some [<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref57">57</xref>] contain posts and stories of users experiencing chronic pain and illness, and others [<xref ref-type="bibr" rid="ref58">58</xref>-<xref ref-type="bibr" rid="ref60">60</xref>] contain stories and experiences from COVID-19 survivors. The social media sources used in our study were as follows:</p>
        <list list-type="bullet">
          <list-item>
            <p>BII [<xref ref-type="bibr" rid="ref61">61</xref>]: This was a dedicated public website with articles on BII-related topics and offered resources related to implant and explant procedures, etc. This website also allowed individuals to post their experiences and concerns about breast implants and related health issues. We extracted individual posts from the website (up to May 10, 2019), and the resulting data set was referred to as BIIweb.</p>
          </list-item>
          <list-item>
            <p>Healing BII [<xref ref-type="bibr" rid="ref62">62</xref>]: This website contained information on postimplant disorders, postexplant healing, breast implant safety, etc. The discussion board of this website had multiple posts and comments on symptoms, signs, etc, which are experienced by individuals with a breast implant or by those who have undergone an explant. The data set extracted from the discussion board of this website (up to May 10, 2019) was referred to as HealingBII.</p>
          </list-item>
          <list-item>
            <p>Instagram posts about BII [<xref ref-type="bibr" rid="ref63">63</xref>]: This website contained a collection of publicly available Instagram posts that used <italic>breastimplantillness</italic> as a hashtag. We extracted the associated texts for each Instagram post with a timestamp between January 10, 2012, and September 4, 2019. The data set extracted from this site was referred to as IG-BII.</p>
          </list-item>
        </list>
        <p>All the comments and posts from the 3 websites were included in the corresponding data sets. <xref ref-type="table" rid="table1">Table 1</xref> presents a summary of the social media data collected. The BIIweb data set had only 187 posts, but these were longer on average (average post length l<sub>avg</sub> of 129 words, SD 124) than those in the other 2 data sets. HealingBII was the second largest data set, with 1920 posts, each with 85 words on average (SD 107). IG-BII was the largest data set, with 28,987 posts and 123 words per post on average (SD 113).</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Statistical summary of social media data analyzed.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="160"/>
            <col width="240"/>
            <col width="140"/>
            <col width="110"/>
            <col width="200"/>
            <col width="150"/>
            <thead>
              <tr valign="bottom">
                <td>Data set</td>
                <td>Posts<sup>a</sup> (n=31,094), n (%)</td>
                <td>l<sub>max</sub><sup>b</sup></td>
                <td>l<sub>min</sub><sup>c</sup></td>
                <td>l<sub>avg</sub><sup>d</sup>, mean (SD)</td>
                <td>Words<sup>e</sup>, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>BIIweb</td>
                <td>187 (0.6)</td>
                <td>669</td>
                <td>3</td>
                <td>129 (124)</td>
                <td>24,191 (0.64)</td>
              </tr>
              <tr valign="top">
                <td>HealingBII</td>
                <td>1920 (6.17)</td>
                <td>1330</td>
                <td>1</td>
                <td>85 (107)</td>
                <td>165,090 (4.38)</td>
              </tr>
              <tr valign="top">
                <td>IG-BII</td>
                <td>28,987 (93.22)</td>
                <td>515</td>
                <td>1</td>
                <td>123 (113)</td>
                <td>3,581,081 (94.98)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Posts: the number of posts and comments in the respective data sets.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>l<sub>max</sub>: the maximum length of a post in words.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>l<sub>min</sub>: the minimum length of a post in words.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>l<sub>avg</sub>: the average length of posts in words.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>Words: the total number of words in the respective data sets.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>The Pipeline</title>
        <sec>
          <title>Overview</title>
          <p><xref rid="figure1" ref-type="fig">Figure 1</xref> shows an overview of the pipeline. We extracted major topics of interest primarily related to symptoms, diseases, and medical procedures from our data sets through the following 3 steps. Each of the steps will be discussed in detail later. The first step involved data preprocessing. We removed all stop words, numeric characters, hyperlinks, hashtags, etc, and converted the remaining characters into lowercase. The second step involved mention extraction and concept mapping. We extracted mentions related to signs, symptoms, diseases, disorders, and medical procedures using the clinical Text Analysis and Knowledge Extraction System (cTAKES) [<xref ref-type="bibr" rid="ref64">64</xref>]. The extracted mentions were further mapped to standard medical concepts represented by concept unique identifiers (CUIs) in the unified medical language system (UMLS) [<xref ref-type="bibr" rid="ref65">65</xref>] ontology. The third step involved topic modeling. We summarized the mapped concepts to topics using latent Dirichlet allocation (LDA) [<xref ref-type="bibr" rid="ref66">66</xref>]. LDA is a probabilistic generative model for topic modeling. It represents each document as a mixture of latent topics, where each topic is modeled as a distribution over words. This modeling consisted of 3 stages: (1) mention replacement, (2) topic modeling using LDA, and (3) analysis and evaluation. In mention replacement, we replaced each extracted mention in the posts with its mapped CUIs and discarded all other words in the posts. We have discussed this step in more detail in the section <italic>Topic modeling</italic>. Then, in topic modeling using LDA, given the corpus of mapped CUIs, LDA generates document-topic and topic-CUI probability distributions. We have discussed this step in more detail in the section <italic>Topic modeling</italic>. 
Finally, during our analysis and evaluation, we further analyzed these distributions to derive a list of topics using the most representative mentions and summarized the extracted mentions for each data set. We have discussed this step in more detail in the section <italic>Results: LDA topics</italic>.</p>
          <fig id="figure1" position="float">
            <label>Figure 1</label>
            <caption>
              <p>Pipeline for breast implant illness social media analysis. ASCII: American standard code for information interchange; CUI: concept unique identifier; LDA: latent Dirichlet allocation; cTAKES: clinical Text Analysis and Knowledge Extraction System.</p>
            </caption>
            <graphic xlink:href="medinform_v9i11e29768_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Data Preprocessing</title>
          <p>We used the Natural Language Toolkit tokenizer [<xref ref-type="bibr" rid="ref67">67</xref>] to tokenize the raw text for each data set. Out of the obtained tokens, we removed the stop-words (most frequently occurring, function words such as conjunctions, prepositions, determiners, etc) using the Natural Language Toolkit English stop-words list. As stop-words carried little or no information on our topics of interest in BII, they could be safely removed, as is typically done in NLP. We also removed all the numeric characters, emojis, non–American Standard Code for Information Interchange (ASCII) characters, hyperlinks, hashtags, and Instagram handles using regular expression matching and converted all the remaining tokens into lowercase to unify different cases for downstream processing.</p>
        </sec>
        <sec>
          <title>Mention Extraction and Concept Mapping</title>
          <p>Mention extraction refers to the extraction of words or phrases that convey a medical concept. We used the cTAKES tool for mention extraction. The cTAKES tool is an open-source NLP tool for clinical information extraction from unstructured clinical texts. cTAKES extracts mentions (ie, words or phrases that convey a medical concept) from posts and maps these mentions to standard medical concepts. In doing so, it also categorizes each extracted mention into one of 5 cTAKES categories: sign and symptom; disease and disorder; medication; procedure; and anatomy; that is, while cTAKES extracts mentions, it also automatically classifies the mentions into one of the 5 categories. For example, in the sentence “Over the years, my tinnitus has become worse to almost debilitating levels,” cTAKES extracts <italic>tinnitus</italic> as a mention of the sign and symptom category. Below, we discuss how to configure the cTAKES in detail.</p>
          <p>We used the fast-dictionary-lookup annotator in cTAKES to extract mentions from the processed data. This annotator identifies and extracts mentions in texts and normalizes them into CUIs in the UMLS standard medical ontology. This normalization of extracted mentions into CUIs is referred to as concept mapping. Each CUI in the UMLS ontology uniquely identifies a medical concept. Hence, we represented extracted mentions using the standard medical concepts of CUIs that cTAKES maps the mentions to. We configured the annotator to use an exact string match and to use the all-term-persistence property. Thus, the annotator could retain all terms, irrespective of the semantic properties of each term. For example, for the phrase <italic>back pain</italic>, the annotator would annotate the generic term <italic>pain</italic> as well as the precise term <italic>back pain</italic>. We chose to use the all-term-persistence property to retain maximum information with respect to precise and generic medical concepts. Finally, the annotator stored the generated annotations in XML Metadata Interchange (XMI) files.</p>
          <p>To obtain the annotations in a human-readable format from the XMI files, we performed the following steps (<xref rid="figure2" ref-type="fig">Figure 2</xref>). We used a custom interpreter to process the XMI files produced by cTAKES and to obtain mappings between mentions and CUIs from cTAKES. We first searched for <italic>UmlsConcept</italic> XML identifiers in the XMI files, where each <italic>UmlsConcept</italic> XML identifier is generally grouped under the <italic>FSArray</italic>, and each <italic>FSArray</italic> is associated with a single ontology concept and the category of the concept. Each concept is assigned one category out of 5 cTAKES categories: sign and symptom; disease and disorder; medication; procedure; and anatomy. Each ontology concept is further associated with a UMLS CUI and an <italic>ontologyConceptArr</italic> identifier. It must be noted that a mention can be mapped to multiple CUIs. For example, the mention <italic>allergic reaction</italic> is categorized as sign and symptom but mapped to 2 different CUIs: <italic>C1527304</italic> and <italic>C0020517</italic>. Then, we extracted the ontology concepts that describe any of these categories: diseases, disorders, signs, symptoms, and medical procedures. Finally, we used the <italic>begin</italic> and <italic>end</italic> markers associated with each <italic>ontologyConceptArr</italic> identifier to obtain the position of the annotated mention in the input post. In this work, we were only interested in 3 of the 5 categories (ie, sign and symptom; disease and disorder; and procedure) to understand BII-related issues. Hence, we only used the mentions categorized into any of these 3 categories.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Pipeline for obtaining annotations from cTAKES. cTAKES: clinical Text Analysis and Knowledge Extraction System; CUI: concept unique identifier; UMLS: unified medical language system.</p>
            </caption>
            <graphic xlink:href="medinform_v9i11e29768_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Topic Modeling</title>
          <p>To conduct topic modeling, we processed the posts as follows: we substituted each mention in the posts with its mapped CUIs and discarded all other words in the posts, which were considered as nonmedical concepts by cTAKES or were not among the 3 categories of interest. If a mention was mapped to multiple CUIs, we replaced it with multiple CUIs. If multiple mentions were mapped to the same CUI, we replaced all such mentions with the CUI. In this way, each post was represented as a bag-of-CUI, instead of a collection of mentions, as the input to the topic modeling and our vocabulary consisted of CUIs. Upon topic modeling, we interpreted the topic-CUI distribution to derive the topics.</p>
          <p>We used LDA [<xref ref-type="bibr" rid="ref66">66</xref>] to learn the topic distributions of each post and the CUI distributions of each topic. LDA is a generative probabilistic model for modeling topics within a document corpus. LDA models each document in the corpus as a mixture of latent topics, where each topic is modeled as a distribution over words in all documents. LDA derives the optimal distributions by maximizing the likelihood of observing the corpus, following the respective distributions. A brief description of LDA is provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> [<xref ref-type="bibr" rid="ref66">66</xref>]. In our experiments, a bag-of-CUIs generated as described above was used as a document in LDA, and the CUIs were words in the document. We used the lda-c software [<xref ref-type="bibr" rid="ref68">68</xref>], which is a very efficient implementation of the LDA method, to conduct topic modeling.</p>
          <p>When LDA is used in topic modeling for general documents (eg, news, scientific literature), words and their frequencies in the documents are used. However, in our analysis, we aimed to understand the medical concepts related to BII from social media texts. Different words may indicate the same medical concepts. For example, joint aches, painful joints, arthralgia, and aching joints all indicate joint pain and are associated with a single medical concept represented by a single CUI. Therefore, instead of using words, we used medical concepts, represented by CUIs, in our LDA analysis. Because multiple words indicating the same medical concept can be mapped to the same CUI, using CUIs can also aggregate and strengthen the information from multiple words, compared with using words, which may be sparse and thus not easy to learn topics from.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>cTAKES Annotations</title>
        <p><xref ref-type="table" rid="table2">Table 2</xref> presents the summary statistics for the annotated mentions and their CUIs mapped by cTAKES. In BIIweb, cTAKES extracted 2186 mentions and mapped them to 475 unique CUIs. In HealingBII, cTAKES extracted 11,080 mentions and mapped them to 1177 unique CUIs. In the largest data set, IG-BII, cTAKES extracted 185,339 mentions (5530 unique) and mapped them to 2871 unique CUIs. Note that the same mention can be mapped to multiple CUIs and can have multiple categories (each CUI has only one category). For example, the mention <italic>flashes</italic> is mapped to 2 different CUIs and then 2 different categories: diseases and medical procedures. <xref ref-type="table" rid="table2">Table 2</xref> presents the statistics for each category of extracted mentions. For each data set, most of the extracted mentions were categorized as signs and symptoms by cTAKES.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Statistical summary of annotations of the clinical Text Analysis and Knowledge Extraction System.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="130"/>
            <col width="120"/>
            <col width="110"/>
            <col width="90"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <col width="70"/>
            <thead>
              <tr valign="bottom">
                <td>Data set</td>
                <td>cwords<sup>a</sup></td>
                <td>annots<sup>b</sup></td>
                <td>maps<sup>c</sup></td>
                <td>M<sup>d</sup></td>
                <td>C<sup>e</sup></td>
                <td>M/C<sup>f</sup></td>
                <td>C/M<sup>g</sup></td>
                <td>S<sup>h</sup></td>
                <td>D<sup>i</sup></td>
                <td>P<sup>j</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>BIIweb</td>
                <td>24,034</td>
                <td>2186</td>
                <td>661</td>
                <td>640</td>
                <td>475</td>
                <td>1.39</td>
                <td>1.03</td>
                <td>385</td>
                <td>149</td>
                <td>106</td>
              </tr>
              <tr valign="top">
                <td>HealingBII</td>
                <td>163,352</td>
                <td>11,080</td>
                <td>1740</td>
                <td>1685</td>
                <td>1177</td>
                <td>1.48</td>
                <td>1.03</td>
                <td>891</td>
                <td>503</td>
                <td>292</td>
              </tr>
              <tr valign="top">
                <td>IG-BII</td>
                <td>3,116,966</td>
                <td>185,339</td>
                <td>5694</td>
                <td>5530</td>
                <td>2871</td>
                <td>1.98</td>
                <td>1.03</td>
                <td>3049</td>
                <td>1549</td>
                <td>932</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>cwords: the total number of words recognized by the clinical Text Analysis and Knowledge Extraction System.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>annots: the total number of extracted mentions belonging to the 3 semantic types (ie, signs and symptoms, diseases and disorders, and medical procedures).</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>maps: the number of unique mention–concept unique identifier mappings.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>M: the number of unique extracted mentions.</p>
            </fn>
            <fn id="table2fn5">
              <p><sup>e</sup>C: the number of unique mapped concept unique identifiers.</p>
            </fn>
            <fn id="table2fn6">
              <p><sup>f</sup>M/C: the average number of extracted mentions mapped to a given concept unique identifier.</p>
            </fn>
            <fn id="table2fn7">
              <p><sup>g</sup>C/M: the average number of concept unique identifiers mapped to an extracted mention.</p>
            </fn>
            <fn id="table2fn8">
              <p><sup>h</sup>S: the number of unique extracted mentions mapped to the signs and symptoms category.</p>
            </fn>
            <fn id="table2fn9">
              <p><sup>i</sup>D: the number of unique extracted mentions that are mapped to the diseases and disorders category.</p>
            </fn>
            <fn id="table2fn10">
              <p><sup>j</sup>P: the number of unique extracted mentions mapped to the medical procedures category.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>To determine if cTAKES can sufficiently extract relevant mentions, we performed a manual annotation and compared the 2 lists of extracted mentions: one from using cTAKES and the other from using manual annotation. We randomly sampled 50 posts from each of the 3 data sets and manually annotated these posts. Upon manual annotation, we extracted mentions (words or phrases) that conveyed the concerns and experiences of social media users involving BII-related symptoms, diseases, and medical procedures. For a random sample of 50 posts (l<sub>avg</sub>=134.18) from BIIweb, we obtained a total of 575 mentions from using manual annotation, and 637 mentions using cTAKES; there were 479 common mentions. Each mention was associated with a post identifier and a character offset. A mention was considered to belong to both lists if it occurred in both lists with the same post identifier and character offset. We found that 83.3% (479/575) of manually annotated mentions were covered by cTAKES. This high coverage demonstrates that cTAKES can capture most of the relevant medical concepts. In contrast, 75.2% (479/637) of the annotated mentions by cTAKES were covered by manual annotation. This further demonstrates that most of the annotated mentions of cTAKES can be confirmed by manual annotation. Similarly, for a random sample of 50 posts (l<sub>avg</sub>=80.02) from HealingBII, 69.5% (194/279) of manually annotated mentions were covered by cTAKES; 70.3% (194/276) of mentions annotated by cTAKES were confirmed by manual annotation. For a random sample of 50 posts (l<sub>avg</sub>=121.00) from IG-BII, the corresponding values were 75.2% (182/242) and 64.3% (182/283), respectively. According to the high overlap in the results between manual annotation and cTAKES across multiple data sets used in our study, it is reasonable to assume that cTAKES is a decent surrogate of manual annotation for BII study through social media data.</p>
      </sec>
      <sec>
        <title>LDA Topics</title>
        <p>To identify the best topic models, we used a grid search to identify the best parameter values for the Dirichlet prior α ∈ {0.01,0.05,0.1,0.5,1,1.5,2,5,10,15,20,25} and the number of topics K ∈ {3,4,5,10,15,20}. To evaluate topic models, we analyzed each LDA topic modeling result for every combination of α and K values corresponding to low perplexity scores [<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref70">70</xref>].</p>
        <p>For each topic modeling result, we analyzed the document-topic and topic-CUI probability distributions to derive topics and their respective top 10 representative mentions. The top 10 representative mentions for a given topic were the most frequent mentions, corresponding to the top 10 CUIs, with the highest probabilities of belonging to the topic. Multiple mentions could be mapped to a given CUI (<xref ref-type="table" rid="table2">Table 2</xref>). We only presented the most frequent mention because all mentions mapped to the same CUI had similar semantics. We further evaluated the quality of topic modeling based on how well the derived topics summarized the most representative mentions. We analyzed each LDA topic modeling result for every combination of α and K and chose the one where the derived topics were distinct and best summarized the most representative mentions. Finally, we identified distinct and meaningful topics using (1) K=4 and α=10 for BIIweb, (2) K=5 and α=10 for HealingBII, and (3) K=5 and α=1.5 for IG-BII. We observed that with higher K values, the most representative mentions were similar across the topics. Hence, the derived topics were not distinct and were difficult to interpret.</p>
        <p><xref ref-type="table" rid="table3">Tables 3</xref>-<xref ref-type="table" rid="table5">5</xref> present the top 10 representative mentions, the frequencies of CUIs corresponding to the mentions (in %), and the interpretations of the topics indicated by the mentions (eg, common signs and symptoms). Note that the frequencies of CUIs are among all the posts, not only in those posts with the highest probability belonging to a certain topic. We presented these frequencies because each post had a certain probability of belonging to a certain topic, and thus frequencies among all posts would better represent the topic information across all the posts. These tables also present examples of posts that have a high probability of belonging to the respective topic. In the examples, the mentions that had high probabilities of belonging to the corresponding topics are italicized. Note that we used CUIs in LDA to derive the topic and word distributions (as discussed in the section Methods—Topic modeling), but we have presented the most frequent mentions (with clear semantics) that were mapped to the respective CUIs (which are identifiers without semantics) in these tables. The mentions in these tables were sorted based on the probabilities of their corresponding CUIs belonging to the respective topics. Please note that these probabilities have not been presented in the tables (they are not the frequencies presented in the tables). Therefore, each topic was represented by its most representative mentions, and thus, summarized such mentions. For example, we interpreted a topic as pain and other signs if there were a significant number of mentions related to pain, such as neck pain, chest pain, and headache. Please note that the topics have not been sorted, and the first columns in Tables 3 to 5 are nominal identifiers. Below, we have discussed the topics derived from LDA for BIIweb and HealingBII data sets from the original posts. Note that 2 topics can still share the same representative mention with different probabilities in the LDA.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Derived topics in BIIweb.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="80"/>
            <col width="710"/>
            <col width="210"/>
            <thead>
              <tr valign="top">
                <td>Topic</td>
                <td>Top 10 mentions</td>
                <td>Interpretation</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Testing (2.34); illness (4.46); problem (2.82); work (1.17); swollen (0.78); drains (0.61); feel (2.51); fatigue (1.82); exhausted (0.39); sensitivity (0.95)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “I had silicone implants done 5 years ago, three years ago after going to the doctor with extreme <italic>fatigue</italic><sup>a</sup> (I was sleeping 14-16 hours a day and was still <italic>exhausted</italic>)”</p>
                    </list-item>
                  </list>
                </td>
                <td>Common signs and symptoms</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Breast implant (6.80); removal (1.30); cancer (0.95); autoimmune (0.95); infection (0.87); scleroderma (0.39); pain (3.68); diagnosis (0.30); alcl (0.30); breast cancer (0.30)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “I had stage 4 breast <italic>cancer</italic> and had chemo and radiation. I tried to have my <italic>breast implants</italic> removed due to <italic>pain</italic>...Then I had an acute <italic>infection</italic> occur a month and a half after they put the new implants in and they were forced to perform an emergency <italic>removal</italic> of the newer implants. I have had all the symptoms of breast implant illness—even after their removal.”</p>
                    </list-item>
                  </list>
                </td>
                <td>Diseases or disorders</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Breast implant (6.80); illness (4.46); toxicity (1.17); foreign body (0.87); heal (0.78); support (0.65); rupture (0.52); cancer (0.95); awareness (0.35); inflammation (0.56)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “...I never had a problem until 2006 at which time I thought something had happened however, my surgeon said I must have just pulled a muscle and that the <italic>implants</italic> seemed fine. Now that surgeon is old and the shop is closed up. I have been suffering for the past 13 years with arthritis, fatigue, brain fog, <italic>inflammation</italic>, hormone imbalances, and adrenal fatigue...”</p>
                    </list-item>
                  </list>
                </td>
                <td>Toxicity</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Pain (3.68); feel (2.51); fatigue (1.82); back pain (0.87); illness (4.46); joint pain (0.56); worse (0.65); anxiety (0.52); ear ringing (0.39); headache (0.39)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “It wasn’t until 2017 where I started to experience <italic>anxiety</italic> and panic attacks (which I didn’t know I was having at the time). With that, along came crazy <italic>headaches</italic>, feeling dizzy, sick, lightheaded, and my right eye would always be swollen and never knew why.”</p>
                    </list-item>
                  </list>
                </td>
                <td>Pain and stress-related disorders</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>The mentions in the examples that had high probabilities of belonging to the corresponding topics are italicized.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Derived topics in HealingBII.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="80"/>
            <col width="710"/>
            <col width="210"/>
            <thead>
              <tr valign="top">
                <td>Topic</td>
                <td>Top 10 mentions</td>
                <td>Interpretation</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Rupture (1.34); supported (0.87); read (1.17); suffering (0.87); happy (0.6); mastectomy (0.46); work (0.96); scare (0.77); reconstruction (0.41); mri (0.72)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “Double <italic>mastectomy</italic><sup>a</sup> in 2015. <italic>Reconstruction</italic> process with expanders then permanent 1000 ml saline implants in early 2016. After that was 9 procedures, a hysterectomy and now MANY health problems.”</p>
                    </list-item>
                  </list>
                </td>
                <td>Surgeries and procedures</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Pain (3.91); joint pain (0.79); fatigued (0.96); ailment (4.70); removal (0.84); hair loss (0.52); headache (0.47); muscle ache (0.34); rash (0.39); infection (0.84)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “In addition to the neuromuscular spasms and <italic>pain</italic>, I’ve suffered with incapacitating chronic <italic>fatigue</italic>, BRAIN FOG and confusion (yes, even while driving), loss of vision and hearing, vertigo, mysterious skin <italic>rashes, hair loss, migraines...</italic>”</p>
                    </list-item>
                  </list>
                </td>
                <td>Pain and other signs</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Problem (2.64); cancer (0.90); autoimmune (0.57); breast cancer (0.38); scars (0.35); treatment (0.43); diagnose (0.29); autoimmune disorder (0.27); lupus (0.29); arthritis (0.26)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “I had capsules form on both breasts from about 2010. I got sick with BII symptoms from 2005 with lots of infections required intravenous and oral antibiotics. My environmental and drug allergies got worse, onset of <italic>arthritis</italic>, skin rashes, <italic>autoimmune</italic> symptoms, started growing low grade <italic>cancers...</italic>”</p>
                    </list-item>
                  </list>
                </td>
                <td>Cancer and other disorders</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Breast implant (3.85); ailment (4.70); toxicity (3.05); healing (1.56); capsulectomy (0.64); infection (0.84); inflammation (0.39); detoxification (0.32); foreign object (0.25); bleed (0.23)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “Some women with silicone <italic>toxicity</italic> have bruising and <italic>bleeding</italic> problems. If I was you, I would try and have the lymph node localized and checked for silicone and removed if it is contaminated beyond detoxing much like a silicone granuloma is removed.”</p>
                    </list-item>
                  </list>
                </td>
                <td>Toxicity</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Emotion (3.70); think (2.26); feel (0.84); normal (0.65); anxiety (0.50); ill (0.61); sensation (0.33); tired (0.28); sores (0.27); depression (0.33)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “Even more heartbreaking and discouraging, has been the <italic>emotional</italic> pain of not being able to freely play with her on the floor due to hip and knee pain, along with leg and foot spasms...but I struggle with many <italic>feelings</italic> of failure as a wife and mother due to physical limitations.”</p>
                    </list-item>
                  </list>
                </td>
                <td>Mental health</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>Italic text indicates the mentions in the examples that had high probability of belonging to the corresponding topics.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Derived topics in IG-BII.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="80"/>
            <col width="710"/>
            <col width="210"/>
            <thead>
              <tr valign="top">
                <td>Topic</td>
                <td>Top 10 mentions</td>
                <td>Interpretation</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Heal (1.46); working (0.90); weighted (1.05); able (0.99); rest (0.37); stress (0.29); exercise (0.28); therapeutic (0.35); sleep (0.36); run (0.23)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “It’s been 14 months since my explant. The journey to <italic>healing</italic><sup>a</sup> hasn’t been an easy one due to setbacks and relapses but better than daily anaphylaxis from getting cold, food, smells, crying, <italic>exercise</italic> and <italic>stress</italic>, then add angina attacks from anaphylaxis.”</p>
                    </list-item>
                  </list>
                </td>
                <td>Physical health</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Malignancy (1.10); removal (0.96); scar (0.75); capsulectomy (0.68); rupture (0.43); cicatrice (0.43); alcl (0.41); augmentation (0.37); lymphoma (0.35); removal of implants (0.29)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “The ugly side of breast implants. It’s not a matter of IF you will get sick...it’s WHEN. implants leak toxic heavy metals without rupture It’s called a gel bleed. Women with implants are 3 times more likely to develop brain, lung and <italic>lymphatic cancer</italic> than women with implants.”</p>
                    </list-item>
                  </list>
                </td>
                <td>Cancer and medical procedures</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Loving (2.43); happiness (2.11); emotion (1.64); think (1.05); feel (0.87); scare (0.55); confidence (0.35); tired (0.38); emotional (0.27); sensation (0.33)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “I was <italic>scared</italic> of looking incomplete. After much deep, inner work on myself, I realized that my worth wasn’t dependent on what I looked like or how big my chest was. I realized that true <italic>happiness</italic> would come from 100% acceptance of what and who I was”</p>
                    </list-item>
                  </list>
                </td>
                <td>Mental health</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Breast implant (7.21); ailment (5.67); toxicity (1.67); aware (0.96); felt worse (0.36); test (0.64); foreign body (0.45); alone (0.33); suffering (0.21); complication (0.20)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “...We get <italic>toxic</italic> from the chemical makeup of the silicone, the <italic>toxic</italic> chemicals that are released when the shell degrades, sick from rupture and sometimes mold.”</p>
                    </list-item>
                  </list>
                </td>
                <td>Toxicity</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Pain (2.52); inflammatory reaction (0.89); fatigue (0.83); anxiousness (0.72); allergy (0.43); depression (0.37); joint pain (0.33); autoimmune disorder (0.32); swell (0.43); infection (0.31)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “For three years, doctors have been unable to diagnose or explain upper body weakness, hand <italic>pain</italic>, and general <italic>inflammation</italic>. I have suffered from periods of high <italic>inflammation</italic>, debilitating <italic>fatigue</italic>, migraines, inability to lose weight, insomnia, low libido, body and <italic>joint pain</italic>, hair loss, dry skin, dry eyes, brain fog, etc.”</p>
                    </list-item>
                  </list>
                </td>
                <td>Common disorders</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>Italic text indicates the mentions in the examples that had high probability of belonging to the corresponding topics.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p><xref ref-type="table" rid="table3">Table 3</xref> presents the topics in the BIIweb data set. Although BIIweb was the smallest data set (<xref ref-type="table" rid="table1">Table 1</xref>), we were still able to identify 4 distinct topics with the most representative mentions, namely, fatigue, infection, toxicity, and anxiety. <xref ref-type="table" rid="table4">Table 4</xref> presents the topics in the HealingBII data set, which shared some common topics and representative mentions with those in BIIweb. For example, pain, cancer, and toxicity were common across these 2 data sets. However, a focused topic unique to HealingBII was surgeries and procedures, where people (mostly patients) discuss the procedures among themselves and share their related experiences. Another unique topic in HealingBII was mental health.</p>
        <p>In addition to physical symptoms, individuals reported significant emotional and mental difficulties, such as depression, and expressed serious symptoms on social media. <xref ref-type="table" rid="table5">Table 5</xref> presents the topics in the IG-BII data set. IG-BII was the largest data set (<xref ref-type="table" rid="table1">Table 1</xref>) and had significantly more posts than the other two. We observed that cancers, mental health, and toxicity emerged as significant topics in this large data set, consistent with those in HealingBII. In IG-BII, people also discussed their recovery process from the issues or events associated with BII. We identified from these 3 data sets frequent mentions of rupture, pains, and fatigue. We also identified mentions of cancer, lupus, and autoimmune disorders. Please note that <xref ref-type="table" rid="table3">Table 3</xref> contains 4 topics for BIIweb, but <xref ref-type="table" rid="table4">Tables 4</xref> and <xref ref-type="table" rid="table5">5</xref> contain 5 topics for HealingBII and IG-BII, respectively. This is because the number of topics was determined by how distinct the topics were, not by the prespecified number of topics.</p>
        <p><xref ref-type="table" rid="table6">Table 6</xref> presents the top 10 representative mentions, the frequencies of CUIs corresponding to the mentions (in %), and interpretations of the topics on the unified data set, combining all 3 data sets BIIweb, HealingBII, and IG-BII. We obtained a unified data set by combining all the posts from the 3 data sets into one corpus. To perform topic modeling, we processed the posts in the unified data set in the same way as we processed the posts in the individual data sets (discussed in the section Methods—Topic modeling). Upon topic modeling, we identified 5 distinct topics using K=5 and α=1.5. We observed that physical health, cancers, mental health, toxicity, and common disorders emerged as significant topics in the unified data set, consistent with those in IG-BII. This was because IG-BII was the largest data set out of the three and comprised 93.22% (28,987/31,094) of the unified data set. We also identified common concerns such as pain, allergy, depression, weight gain, cancer, inflammation, and toxicity issues from the individual and unified data sets. This implies that the above-mentioned factors were frequently associated with BII.</p>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Derived topics in the unified data set.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="80"/>
            <col width="710"/>
            <col width="210"/>
            <thead>
              <tr valign="top">
                <td>Topic</td>
                <td>Top 10 mentions</td>
                <td>Interpretation</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Working (1.45); ate (0.92); weight (0.79); runs (0.40); thinking (2.68); exercise (0.25); talk (0.50); walking (0.35); nutrition (0.15); move (0.28)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “...I’m now healthier than I have been in the last 7 years of my life!...I explanted in Feb of 2018, a few months after explant, I gained my <italic>weight</italic><sup>a</sup> back and found a love for true self care and <italic>working</italic> out.”</p>
                    </list-item>
                  </list>
                </td>
                <td>Physical health</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Illnesses (4.45); cancer (0.87); ruptures (0.77); removal (0.76); awareness (0.73); suffers (0.83); capsulectomy (0.54); autoimmune (0.52); breast augmentation (0.30); augmentation (0.28);</p>
                    </list-item>
                    <list-item>
                      <p>Example: “I was diagnosed with breast <italic>cancer</italic> at the young age of 30 and ended up with a double mastectomy as part of that process...now 10 years later I have just 15 weeks ago had my implants removed. They had <italic>ruptured</italic>, were toxic and giving me health issues”</p>
                    </list-item>
                  </list>
                </td>
                <td>Cancer and medical procedures</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Feel (5.94); loved (2.97); thinking (2.68); happier (1.64); feelings (1.47); afraid (0.66); confidence (0.27); support (0.79); able (0.77); alive (0.17);</p>
                    </list-item>
                    <list-item>
                      <p>Example: “When I found out I was sick and I had to tear apart my body to get better I never thought I’d be happy with myself again. I am 4 weeks post op and <italic>feeling</italic> more happy and healthy than ever. I was worried I’d never be <italic>loved</italic> again.”</p>
                    </list-item>
                  </list>
                </td>
                <td>Mental health</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Heal (2.26); scars (0.58); scarred (0.33); drain (0.26); toxic (1.97); sights (1.25); inflammation (0.68); bulge (0.36); tenderness (0.20); red (0.15); damage (0.16);</p>
                    </list-item>
                    <list-item>
                      <p>Example: “I was so worried about how <italic>red</italic> and raised up my <italic>scars</italic> were...then they got really inflamed, sore and raised up around 3 weeks and i was really stressed over it. then overnight the <italic>inflammation</italic> and redness went down...”</p>
                    </list-item>
                  </list>
                </td>
                <td>Common signs, symptoms, and toxicity</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Pain (2.09); tired all the time (0.69); anxiety (0.57); joint pain (0.46); alopecia (0.39); weight gain (0.37); allergies (0.35); depression (0.29); pain back (0.23); headache (0.22)</p>
                    </list-item>
                    <list-item>
                      <p>Example: “Before I had the explant, I had many unexplained symptoms (brain fog, <italic>joint pain</italic>, back and neck pain, <italic>tired all the time</italic>, psoriasis, afib, just to mention a few) since I awoke from surgery I have had absolutely no neck, back, or joint pain.”</p>
                    </list-item>
                  </list>
                </td>
                <td>Common disorders</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>Italic text indicates the mentions in the examples that had high probability of belonging to the corresponding topics.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p><xref ref-type="table" rid="table7">Table 7</xref> presents the percentage of posts per topic, where a post <italic>d</italic> is considered to belong to a topic <italic>z</italic> if among all topics that <italic>d</italic> has, <italic>z</italic> has the highest probability. Although the distributions are not completely consistent across data sets, toxicity remained a notable topic across all data sets. This indicates that toxicity-related issues were common and were significantly associated with BII. In addition, pain, cancer, mental health, and other disorders were also associated with breast implants.</p>
        <table-wrap position="float" id="table7">
          <label>Table 7</label>
          <caption>
            <p>Distribution of posts among the topics.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="670"/>
            <col width="300"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Data set and topics</td>
                <td>Posts, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>BIIweb</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Common signs and symptoms</td>
                <td>62 (33.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Diseases or disorders</td>
                <td>28 (15)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Toxicity</td>
                <td>50 (26.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Pain and stress-related disorders</td>
                <td>47 (25.1)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>HealingBII</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Surgeries and procedures</td>
                <td>713 (37.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Pain and other signs</td>
                <td>221 (11.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Cancer and other disorders</td>
                <td>221 (11.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Toxicity</td>
                <td>505 (26.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Mental health</td>
                <td>260 (13.6)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>IG-BII</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Physical health</td>
                <td>11,299 (39)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Cancer and medical procedures</td>
                <td>3890 (13.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Mental health</td>
                <td>4879 (16.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Toxicity</td>
                <td>5415 (18.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Common disorders</td>
                <td>3504 (12.1)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Unified</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Physical health</td>
                <td>4760 (15.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Cancer and medical procedures</td>
                <td>10,637 (34.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Mental health</td>
                <td>7954 (25.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Common signs, symptoms, and toxicity</td>
                <td>4030 (13)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Common disorders</td>
                <td>3713 (11.9)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>To understand the signs, symptoms, and diseases or disorders associated with BII, a condition reported primarily on social media rather than in medical reports, we collected social media posts and analyzed them using NLP and topic modeling. We extracted mentions related to signs, symptoms, diseases, disorders, and medical procedures using cTAKES, mapped them to standard medical concepts, and summarized the mapped concepts to topics using LDA. We found that mentions such as rupture, infection, inflammation, pain, and fatigue were common self-reported issues. We also found that mental health–related concerns such as stress, anxiety, and depression, as well as diseases such as cancers and autoimmune disorders, were common concerns. cTAKES was also able to extract medication and anatomy information, but these were not used in our LDA analysis, given that the objective of our study was not to study the medications used or the anatomy related to BII.</p>
        <p>In our method, we relied on cTAKES and the rich UMLS dictionary to extract all relevant mentions, including their lexical variants (synonyms, abbreviations, paraphrases). To determine if cTAKES could sufficiently extract relevant mentions, we performed a manual annotation to extract all the relevant mentions and compared them with the extracted mentions from cTAKES. We found that cTAKES could sufficiently capture relevant medical concepts and was comparable with manual annotation. It is worth noting that we did not evaluate the performance of our mention extraction module on all the posts of each data set, which is typically performed using precision and recall metrics when there are ground-truth labels associated with each mention. However, in order to have such labels, careful manual annotations based on domain knowledge of BII are required. Unfortunately, such domain knowledge on complications, symptoms, and other issues associated with or caused by BII was not fully available. Our goal in this study is to provide useful information from social media data that could complement our current knowledge. Therefore, in this preliminary study, we used all annotated mentions, assuming that cTAKES enabled high-quality annotations.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>We acknowledge that cTAKES might not have been able to extract all relevant mentions from our social media data sets. This is because cTAKES was originally designed for extraction of medical entities from clinical notes, which have very different wording and writing styles compared with social media data. As social media data comprise informal phrases, short ambiguous texts, emoticons, and a wide range of lexical variants corresponding to a single concept, cTAKES might not work flawlessly on social media data, although we observed reasonable output from cTAKES. We also observed that cTAKES often associated a single mention with multiple CUIs belonging to the same category. We think this was because of the presence of multiple mappings for a given mention in the UMLS metathesaurus. Regardless, the extracted mentions and the mapping of mentions to UMLS CUIs, as generated by cTAKES, were used for topic modeling without any manual verification or evaluation. In the future, we will develop a detailed guideline to further evaluate the extracted mentions before using them in topic modeling.</p>
        <p>Our study had some limitations. First, LDA is an unsupervised learning technique in which the number of topics (K) is assumed to be known a priori. However, it is difficult to accurately estimate K for a given data set. In our study, we used a grid search to obtain different K values. Without full domain knowledge, it remains nontrivial to evaluate the LDA results for each K value. In our study, we selected the topics based on α and K values. We did not use perplexity [<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref70">70</xref>], a widely used metric in topic modeling, to select the topics, because as studied in the literature (eg, Chang et al [<xref ref-type="bibr" rid="ref71">71</xref>]), perplexity often does not correlate well with topic interpretability; in our case, the lowest perplexity did not always enable intuitive or meaningful topics. In the future, we will develop more rigorous ways to select the number of topics and evaluate the topic modeling results. Second, in this study, we did not conduct a sentiment analysis of the posts to understand the positive or negative opinions expressed in the posts. We plan to include this process before topic modeling to generate a cleaner data set for topic modeling.</p>
        <p>It is worth noting that social media data could be of variable quality (eg, misspelling, misconception, and biased opinions), particularly compared with medical literature data. Anyone can post on social media, and so the derived content may be from individuals who may have other implant-specific issues such as capsular contracture or implant infection. Thus, understanding the diseases, disorders, symptoms, signs, etc, associated with a drug, disease, or medical procedure from social media data would always be at risk from confounders or errors. However, given that the medical knowledge and literature on BII have not been well established, and the related concepts are not well defined or well accepted, using social media data to understand emerging issues could be a meaningful starting point. Still, any findings from social media data would require a rigorous evaluation and validation based on medical and biological knowledge, experiments, clinical practice, etc. In addition, we analyzed only 3 websites, albeit the most relevant and prolific ones dedicated to BII discussions. A more comprehensive analysis of social media data on a much larger scale would be beneficial to better understand BII in a larger, diverse population. Sentiment analysis of social media data could be another valuable analysis to enable more insights into the health experiences of users or patients and their emotions or feelings. We will consider sentiment analysis in our future research when BII is better understood, and we can accurately annotate social media data.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study has important implications for future methodological and clinical research. Future methodological research on NLP could include causality inference between BII and symptom and sign mentions from social media to understand their relations, etc. Our findings could provide the relevant domains for clinical research studies seeking to develop measures of BII and to identify its causes. More specifically, our results can provide a patient-derived definition of BII, which can help clinicians treating patients with BII concerns to use this patient-centered language. Our methods and informatics strategies applied in this study would also provide working examples for analyzing other emerging but not well-defined illnesses from social media data.</p>
        <p>Our analysis of social media data identified mentions such as rupture, infection, inflammation, pain, and fatigue, which were common self-reported issues on social media sites dedicated to BII. In addition, our analysis showed that a significant number of user comments and posts were also concerned with mental and physical health and toxicity issues after having breast implants. The findings from our study could be used to further the scientific study of BII, as well as the care of patients presenting with the described symptoms, by allowing clinicians to develop a patient-centered language to better approach the patients with concerns. Our study provides the first analysis and derived knowledge of BII from social media using NLP techniques and demonstrates the potential of using social media information to better understand emerging illnesses.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>A brief description of latent Dirichlet allocation.</p>
        <media xlink:href="medinform_v9i11e29768_app1.docx" xlink:title="DOCX File , 53 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ASCII</term>
          <def>
            <p>American Standard Code for Information Interchange</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BII</term>
          <def>
            <p>breast implant illness</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">cTAKES</term>
          <def>
            <p>clinical Text Analysis and Knowledge Extraction System</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">CUI</term>
          <def>
            <p>concept unique identifier</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">LDA</term>
          <def>
            <p>latent Dirichlet allocation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">UMLS</term>
          <def>
            <p>Unified Medical Language System</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">XMI</term>
          <def>
            <p>XML Metadata Interchange</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>XN conceived the research, obtained funding for the research, and supervised VD; PK, MN, and CL provided substantial medical background and insights; VD and XN conducted the research, including data curation, methodology design and implementation, and analysis; VD drafted the original manuscript; VD and XN edited the manuscript; PK, MN, and CL reviewed the manuscript and provided constructive suggestions and feedback.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Barros</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Duggan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rebholz-Schuhmann</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The application of internet-based sources for public health surveillance (Infoveillance): systematic review</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>03</month>
          <day>13</day>
          <volume>22</volume>
          <issue>3</issue>
          <fpage>e13680</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/3/e13680/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13680</pub-id>
          <pub-id pub-id-type="medline">32167477</pub-id>
          <pub-id pub-id-type="pii">v22i3e13680</pub-id>
          <pub-id pub-id-type="pmcid">PMC7101503</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schillinger</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chittamuru</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ramírez</surname>
              <given-names>AS</given-names>
            </name>
          </person-group>
          <article-title>From "Infodemics" to health promotion: a novel framework for the role of social media in public health</article-title>
          <source>Am J Public Health</source>
          <year>2020</year>
          <month>09</month>
          <volume>110</volume>
          <issue>9</issue>
          <fpage>1393</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.2105/AJPH.2020.305746</pub-id>
          <pub-id pub-id-type="medline">32552021</pub-id>
          <pub-id pub-id-type="pmcid">PMC7427212</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chaudhary</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Modeling spatiotemporal pattern of depressive symptoms caused by COVID-19 using social media data mining</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2020</year>
          <month>07</month>
          <day>10</day>
          <volume>17</volume>
          <issue>14</issue>
          <fpage>4988</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph17144988"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph17144988</pub-id>
          <pub-id pub-id-type="medline">32664388</pub-id>
          <pub-id pub-id-type="pii">ijerph17144988</pub-id>
          <pub-id pub-id-type="pmcid">PMC7400345</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Using reports of symptoms and diagnoses on social media to predict COVID-19 case counts in mainland China: observational infoveillance study</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>05</month>
          <day>28</day>
          <volume>22</volume>
          <issue>5</issue>
          <fpage>e19421</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/5/e19421/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/19421</pub-id>
          <pub-id pub-id-type="medline">32452804</pub-id>
          <pub-id pub-id-type="pii">v22i5e19421</pub-id>
          <pub-id pub-id-type="pmcid">PMC7257484</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aiello</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Renson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zivich</surname>
              <given-names>PN</given-names>
            </name>
          </person-group>
          <article-title>Social media- and internet-based disease surveillance for public health</article-title>
          <source>Annu Rev Public Health</source>
          <year>2020</year>
          <month>04</month>
          <day>02</day>
          <volume>41</volume>
          <fpage>101</fpage>
          <lpage>18</lpage>
          <pub-id pub-id-type="doi">10.1146/annurev-publhealth-040119-094402</pub-id>
          <pub-id pub-id-type="medline">31905322</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pang</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Retrospective analysis of the possibility of predicting the COVID-19 outbreak from Internet searches and social media data, China, 2020</article-title>
          <source>Euro Surveill</source>
          <year>2020</year>
          <month>03</month>
          <volume>25</volume>
          <issue>10</issue>
          <fpage>2000199</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.eurosurveillance.org/content/10.2807/1560-7917.ES.2020.25.10.2000199"/>
          </comment>
          <pub-id pub-id-type="doi">10.2807/1560-7917.ES.2020.25.10.2000199</pub-id>
          <pub-id pub-id-type="medline">32183935</pub-id>
          <pub-id pub-id-type="pmcid">PMC7078825</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ginsberg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mohebbi</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Brammer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Smolinski</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Brilliant</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Detecting influenza epidemics using search engine query data</article-title>
          <source>Nature</source>
          <year>2009</year>
          <month>02</month>
          <day>19</day>
          <volume>457</volume>
          <issue>7232</issue>
          <fpage>1012</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.1038/nature07634</pub-id>
          <pub-id pub-id-type="medline">19020500</pub-id>
          <pub-id pub-id-type="pii">nature07634</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Naslund</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Grande</surname>
              <given-names>SW</given-names>
            </name>
            <name name-style="western">
              <surname>Aschbrenner</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Elwyn</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Naturally occurring peer support through social media: the experiences of individuals with severe mental illness using YouTube</article-title>
          <source>PLoS One</source>
          <year>2014</year>
          <volume>9</volume>
          <issue>10</issue>
          <fpage>e110171</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0110171"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0110171</pub-id>
          <pub-id pub-id-type="medline">25333470</pub-id>
          <pub-id pub-id-type="pii">PONE-D-14-24033</pub-id>
          <pub-id pub-id-type="pmcid">PMC4198188</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Foufi</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Timakum</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gaudet-Blavignac</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lovis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Mining of textual health information from Reddit: analysis of chronic diseases with extracted entities and their relations</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>06</month>
          <day>13</day>
          <volume>21</volume>
          <issue>6</issue>
          <fpage>e12876</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/6/e12876/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12876</pub-id>
          <pub-id pub-id-type="medline">31199327</pub-id>
          <pub-id pub-id-type="pii">v21i6e12876</pub-id>
          <pub-id pub-id-type="pmcid">PMC6595941</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wakamiya</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Morita</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kano</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ohkuma</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Aramaki</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Tweet classification toward Twitter-based disease surveillance: new data, methods, and evaluations</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>02</month>
          <day>20</day>
          <volume>21</volume>
          <issue>2</issue>
          <fpage>e12783</fpage>
          <pub-id pub-id-type="doi">10.2196/12783</pub-id>
          <pub-id pub-id-type="medline">30785407</pub-id>
          <pub-id pub-id-type="pii">v21i2e12783</pub-id>
          <pub-id pub-id-type="pmcid">PMC6401666</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Attai</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Cowher</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Hamadani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schoger</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Staley</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Landercasper</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Twitter social media is an effective tool for breast cancer patient education and support: patient-reported outcomes by survey</article-title>
          <source>J Med Internet Res</source>
          <year>2015</year>
          <volume>17</volume>
          <issue>7</issue>
          <fpage>e188</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmir.org/2015/7/e188/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.4721</pub-id>
          <pub-id pub-id-type="medline">26228234</pub-id>
          <pub-id pub-id-type="pii">v17i7e188</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Osadchiy</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Mills</surname>
              <given-names>JN</given-names>
            </name>
            <name name-style="western">
              <surname>Eleswarapu</surname>
              <given-names>SV</given-names>
            </name>
          </person-group>
          <article-title>Understanding patient anxieties in the social media era: qualitative analysis and natural language processing of an online male infertility community</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>03</month>
          <day>10</day>
          <volume>22</volume>
          <issue>3</issue>
          <fpage>e16728</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/3/e16728/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/16728</pub-id>
          <pub-id pub-id-type="medline">32154785</pub-id>
          <pub-id pub-id-type="pii">v22i3e16728</pub-id>
          <pub-id pub-id-type="pmcid">PMC7093775</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nobles</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Leas</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Althouse</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Longhurst</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Ayers</surname>
              <given-names>JW</given-names>
            </name>
          </person-group>
          <article-title>Requests for diagnoses of sexually transmitted diseases on a social media platform</article-title>
          <source>J Am Med Assoc</source>
          <year>2019</year>
          <month>11</month>
          <day>05</day>
          <volume>322</volume>
          <issue>17</issue>
          <fpage>1712</fpage>
          <lpage>3</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2019.14390</pub-id>
          <pub-id pub-id-type="medline">31688875</pub-id>
          <pub-id pub-id-type="pii">2753884</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kahlor</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mackert</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Perceptions of infertility information and support sources among female patients who access the internet</article-title>
          <source>Fertil Steril</source>
          <year>2009</year>
          <month>01</month>
          <volume>91</volume>
          <issue>1</issue>
          <fpage>83</fpage>
          <lpage>90</lpage>
          <pub-id pub-id-type="doi">10.1016/j.fertnstert.2007.11.005</pub-id>
          <pub-id pub-id-type="medline">18243181</pub-id>
          <pub-id pub-id-type="pii">S0015-0282(07)03970-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guntuku</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Yaden</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Kern</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Detecting depression and mental illness on social media: an integrative review</article-title>
          <source>Curr Opin Behav Sci</source>
          <year>2017</year>
          <month>12</month>
          <volume>18</volume>
          <fpage>43</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cobeha.2017.07.005</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Karmen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hsiung</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Wetter</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Screening internet forum participants for depression symptoms by assembling and enhancing multiple NLP methods</article-title>
          <source>Comput Methods Programs Biomed</source>
          <year>2015</year>
          <month>06</month>
          <volume>120</volume>
          <issue>1</issue>
          <fpage>27</fpage>
          <lpage>36</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cmpb.2015.03.008</pub-id>
          <pub-id pub-id-type="medline">25891366</pub-id>
          <pub-id pub-id-type="pii">S0169-2607(15)00062-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dreisbach</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Koleck</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Bourne</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Bakken</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A systematic review of natural language processing and text mining of symptoms from electronic patient-authored text data</article-title>
          <source>Int J Med Inform</source>
          <year>2019</year>
          <month>05</month>
          <volume>125</volume>
          <fpage>37</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30914179"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2019.02.008</pub-id>
          <pub-id pub-id-type="medline">30914179</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(18)31378-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC6438188</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Raymond</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Powell</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Potential of social media as a tool to combat foodborne illness</article-title>
          <source>Perspect Public Health</source>
          <year>2014</year>
          <month>07</month>
          <volume>134</volume>
          <issue>4</issue>
          <fpage>225</fpage>
          <lpage>30</lpage>
          <pub-id pub-id-type="doi">10.1177/1757913914538015</pub-id>
          <pub-id pub-id-type="medline">24990140</pub-id>
          <pub-id pub-id-type="pii">134/4/225</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Mansour</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Choucair</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Olson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nissen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bhatt</surname>
              <given-names>J</given-names>
            </name>
            <collab>Centers for Disease Control and Prevention</collab>
          </person-group>
          <article-title>Health department use of social media to identify foodborne illness - Chicago, Illinois, 2013-2014</article-title>
          <source>MMWR Morb Mortal Wkly Rep</source>
          <year>2014</year>
          <month>08</month>
          <day>15</day>
          <volume>63</volume>
          <issue>32</issue>
          <fpage>681</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/mmwr/preview/mmwrhtml/mm6332a1.htm"/>
          </comment>
          <pub-id pub-id-type="medline">25121710</pub-id>
          <pub-id pub-id-type="pii">mm6332a1</pub-id>
          <pub-id pub-id-type="pmcid">PMC4584908</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Casas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mugellini</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Abou Khaled</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Early detection of foodborne illnesses in social media</article-title>
          <source>Proceedings of the 2nd International Conference on Human Interaction and Emerging Technologies: Future Applications (IHIET-AI 2020)</source>
          <year>2020</year>
          <conf-name>2nd International Conference on Human Interaction and Emerging Technologies: Future Applications (IHIET-AI 2020)</conf-name>
          <conf-date>April 23-25, 2020</conf-date>
          <conf-loc>Lausanne, Switzerland</conf-loc>
          <publisher-loc>Lausanne, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>415</fpage>
          <lpage>20</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-030-44267-5_62</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McGough</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Hawkins</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Santillana</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Forecasting Zika incidence in the 2016 Latin America outbreak combining traditional disease surveillance with search, social media, and news report data</article-title>
          <source>PLoS Negl Trop Dis</source>
          <year>2017</year>
          <month>01</month>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>e0005295</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://journals.plos.org/plosntds/article?id=10.1371/journal.pntd.0005295"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pntd.0005295</pub-id>
          <pub-id pub-id-type="medline">28085877</pub-id>
          <pub-id pub-id-type="pii">PNTD-D-16-01733</pub-id>
          <pub-id pub-id-type="pmcid">PMC5268704</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhi</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Health information on social media helps mitigate Crohn's disease symptoms and improves patients' clinical course</article-title>
          <source>Comput Hum Behav</source>
          <year>2021</year>
          <month>02</month>
          <volume>115</volume>
          <fpage>106588</fpage>
          <pub-id pub-id-type="doi">10.1016/j.chb.2020.106588</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pandrekar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gopalkrishna</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Srivastava</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Saltz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Saltz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Social media based analysis of opioid epidemic using Reddit</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2018</year>
          <conf-name>AMIA Annual Symposium</conf-name>
          <conf-date>November 3-7, 2018</conf-date>
          <conf-loc>San Francisco, CA</conf-loc>
          <fpage>867</fpage>
          <lpage>76</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30815129"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marques-Toledo</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Degener</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Vinhal</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Coelho</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Meira</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Codeço</surname>
              <given-names>CT</given-names>
            </name>
            <name name-style="western">
              <surname>Teixeira</surname>
              <given-names>MM</given-names>
            </name>
          </person-group>
          <article-title>Dengue prediction by the web: tweets are a useful tool for estimating and forecasting Dengue at country and city level</article-title>
          <source>PLoS Negl Trop Dis</source>
          <year>2017</year>
          <month>07</month>
          <volume>11</volume>
          <issue>7</issue>
          <fpage>e0005729</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pntd.0005729"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pntd.0005729</pub-id>
          <pub-id pub-id-type="medline">28719659</pub-id>
          <pub-id pub-id-type="pii">PNTD-D-16-01761</pub-id>
          <pub-id pub-id-type="pmcid">PMC5533462</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Signorini</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Segre</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Polgreen</surname>
              <given-names>PM</given-names>
            </name>
          </person-group>
          <article-title>The use of Twitter to track levels of disease activity and public concern in the U.S. during the influenza A H1N1 pandemic</article-title>
          <source>PLoS One</source>
          <year>2011</year>
          <volume>6</volume>
          <issue>5</issue>
          <fpage>e19467</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0019467"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0019467</pub-id>
          <pub-id pub-id-type="medline">21573238</pub-id>
          <pub-id pub-id-type="pii">PONE-D-10-02464</pub-id>
          <pub-id pub-id-type="pmcid">PMC3087759</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Broniatowski</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Paul</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>National and local influenza surveillance through Twitter: an analysis of the 2012-2013 influenza epidemic</article-title>
          <source>PLoS One</source>
          <year>2013</year>
          <volume>8</volume>
          <issue>12</issue>
          <fpage>e83672</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0083672"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0083672</pub-id>
          <pub-id pub-id-type="medline">24349542</pub-id>
          <pub-id pub-id-type="pii">PONE-D-13-35058</pub-id>
          <pub-id pub-id-type="pmcid">PMC3857320</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Klembczyk</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Jalalpour</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Levin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Washington</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Pines</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Rothman</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Dugas</surname>
              <given-names>AF</given-names>
            </name>
          </person-group>
          <article-title>Google Flu Trends spatial variability validated against emergency department influenza-related visits</article-title>
          <source>J Med Internet Res</source>
          <year>2016</year>
          <volume>18</volume>
          <issue>6</issue>
          <fpage>e175</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmir.org/2016/6/e175/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.5585</pub-id>
          <pub-id pub-id-type="medline">27354313</pub-id>
          <pub-id pub-id-type="pii">v18i6e175</pub-id>
          <pub-id pub-id-type="pmcid">PMC4942685</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eysenbach</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Infodemiology and infoveillance: framework for an emerging set of public health informatics methods to analyze search, communication and publication behavior on the internet</article-title>
          <source>J Med Internet Res</source>
          <year>2009</year>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>e11</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmir.org/2009/1/e11/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.1157</pub-id>
          <pub-id pub-id-type="medline">19329408</pub-id>
          <pub-id pub-id-type="pii">v11i1e11</pub-id>
          <pub-id pub-id-type="pmcid">PMC2762766</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Cuomo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Purushothaman</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Mackey</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Data mining and content analysis of Chinese social media platform Weibo during early COVID-19 outbreak: a retrospective observational infoveillance study</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2020</year>
          <month>04</month>
          <day>14</day>
          <volume>6</volume>
          <issue>2</issue>
          <fpage>e18700</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2020/2/e18700/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/18700</pub-id>
          <pub-id pub-id-type="medline">32293582</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Mining the characteristics of COVID-19 patients in China: analysis of social media posts</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>05</month>
          <day>17</day>
          <volume>22</volume>
          <issue>5</issue>
          <fpage>e19087</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/5/e19087/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/19087</pub-id>
          <pub-id pub-id-type="medline">32401210</pub-id>
          <pub-id pub-id-type="pii">v22i5e19087</pub-id>
          <pub-id pub-id-type="pmcid">PMC7236610</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="web">
          <article-title>2019 Plastic Surgery Statistics Report</article-title>
          <source>American Society of Plastic Surgeons (ASPS)</source>
          <year>2019</year>
          <access-date>2021-03-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.plasticsurgery.org/news/plastic-surgery-statistics?sub=2019+Plastic+Surgery+Statistics">https://www.plasticsurgery.org/news/plastic-surgery-statistics?sub=2019+Plastic+Surgery+Statistics</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <article-title>2018 National Plastic Surgery Statistics</article-title>
          <source>American Society of Plastic Surgeons (ASPS)</source>
          <year>2018</year>
          <access-date>2019-07-18</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.plasticsurgery.org/documents/News/Statistics/2018/plastic-surgery-statistics-report-2018.pdf">https://www.plasticsurgery.org/documents/News/Statistics/2018/plastic-surgery-statistics-report-2018.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Balk</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Earley</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Avendano</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Raman</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Long-term health outcomes in women with silicone gel breast implants: a systematic review</article-title>
          <source>Ann Intern Med</source>
          <year>2016</year>
          <month>02</month>
          <day>02</day>
          <volume>164</volume>
          <issue>3</issue>
          <fpage>164</fpage>
          <lpage>75</lpage>
          <pub-id pub-id-type="doi">10.7326/M15-1169</pub-id>
          <pub-id pub-id-type="medline">26550776</pub-id>
          <pub-id pub-id-type="pii">2468813</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Watad</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenberg</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Tiosano</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tervaert</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Yavne</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shoenfeld</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shalev</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chodick</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Amital</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Silicone breast implants and the risk of autoimmune/rheumatic disorders: a real-world analysis</article-title>
          <source>Int J Epidemiol</source>
          <year>2018</year>
          <month>12</month>
          <day>01</day>
          <volume>47</volume>
          <issue>6</issue>
          <fpage>1846</fpage>
          <lpage>54</lpage>
          <pub-id pub-id-type="doi">10.1093/ije/dyy217</pub-id>
          <pub-id pub-id-type="medline">30329056</pub-id>
          <pub-id pub-id-type="pii">5133598</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Labadie</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Korta</surname>
              <given-names>DZ</given-names>
            </name>
            <name name-style="western">
              <surname>Barton</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Mesinkovska</surname>
              <given-names>NA</given-names>
            </name>
          </person-group>
          <article-title>Cutaneous hypersensitivity-like reactions associated with breast implants: a review</article-title>
          <source>Dermatol Surg</source>
          <year>2018</year>
          <month>03</month>
          <volume>44</volume>
          <issue>3</issue>
          <fpage>323</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1097/DSS.0000000000001448</pub-id>
          <pub-id pub-id-type="medline">29293108</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Calobrace</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Stevens</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Capizzi</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Godinez</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Beckstrand</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Risk factor analysis for capsular contracture: a 10-year Sientra study using round, smooth, and textured implants for breast augmentation</article-title>
          <source>Plast Reconstr Surg</source>
          <year>2018</year>
          <month>04</month>
          <volume>141</volume>
          <issue>4S</issue>
          <fpage>20</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1097/PRS.0000000000004351</pub-id>
          <pub-id pub-id-type="medline">29595715</pub-id>
          <pub-id pub-id-type="pii">00006534-201804001-00005</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rohrich</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kaplan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dayan</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Silicone implant illness: science versus myth?</article-title>
          <source>Plast Reconstr Surg</source>
          <year>2019</year>
          <volume>144</volume>
          <issue>1</issue>
          <fpage>98</fpage>
          <lpage>109</lpage>
          <pub-id pub-id-type="doi">10.1097/prs.0000000000005710</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Coroneos</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Selber</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Offodile</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Butler</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Clemens</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>US FDA breast implant postapproval studies: long-term outcomes in 99,993 patients</article-title>
          <source>Ann Surg</source>
          <year>2019</year>
          <month>01</month>
          <volume>269</volume>
          <issue>1</issue>
          <fpage>30</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1097/SLA.0000000000002990</pub-id>
          <pub-id pub-id-type="medline">30222598</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gabriel</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>O'Fallon</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>Kurland</surname>
              <given-names>LT</given-names>
            </name>
            <name name-style="western">
              <surname>Beard</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Woods</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Melton</surname>
              <given-names>LJ</given-names>
            </name>
          </person-group>
          <article-title>Risk of connective-tissue diseases and other disorders after breast implantation</article-title>
          <source>N Engl J Med</source>
          <year>1994</year>
          <month>06</month>
          <day>16</day>
          <volume>330</volume>
          <issue>24</issue>
          <fpage>1697</fpage>
          <lpage>702</lpage>
          <pub-id pub-id-type="doi">10.1056/NEJM199406163302401</pub-id>
          <pub-id pub-id-type="medline">8190133</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Fornasier</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Lugowski</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ibanez</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>An outcome analysis of 100 women after explantation of silicone gel breast implants</article-title>
          <source>Ann Plast Surg</source>
          <year>1997</year>
          <month>07</month>
          <volume>39</volume>
          <issue>1</issue>
          <fpage>9</fpage>
          <lpage>19</lpage>
          <pub-id pub-id-type="doi">10.1097/00000637-199707000-00002</pub-id>
          <pub-id pub-id-type="medline">9229086</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Janowsky</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Kupper</surname>
              <given-names>LL</given-names>
            </name>
            <name name-style="western">
              <surname>Hulka</surname>
              <given-names>BS</given-names>
            </name>
          </person-group>
          <article-title>Meta-analyses of the relation between silicone breast implants and the risk of connective-tissue diseases</article-title>
          <source>N Engl J Med</source>
          <year>2000</year>
          <month>03</month>
          <day>16</day>
          <volume>342</volume>
          <issue>11</issue>
          <fpage>781</fpage>
          <lpage>90</lpage>
          <pub-id pub-id-type="doi">10.1056/NEJM200003163421105</pub-id>
          <pub-id pub-id-type="medline">10717013</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rohrich</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kenkel</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>WP</given-names>
            </name>
            <name name-style="western">
              <surname>Beran</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Conner</surname>
              <given-names>WC</given-names>
            </name>
          </person-group>
          <article-title>A prospective analysis of patients undergoing silicone breast implant explantation</article-title>
          <source>Plast Reconstr Surg</source>
          <year>2000</year>
          <month>06</month>
          <volume>105</volume>
          <issue>7</issue>
          <fpage>2529</fpage>
          <lpage>38</lpage>
          <pub-id pub-id-type="doi">10.1097/00006534-200006000-00036</pub-id>
          <pub-id pub-id-type="medline">10845310</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nahabedian</surname>
              <given-names>MY</given-names>
            </name>
            <name name-style="western">
              <surname>Tsangaris</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Momen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Manson</surname>
              <given-names>PN</given-names>
            </name>
          </person-group>
          <article-title>Infectious complications following breast reconstruction with expanders and implants</article-title>
          <source>Plast Reconstr Surg</source>
          <year>2003</year>
          <month>08</month>
          <volume>112</volume>
          <issue>2</issue>
          <fpage>467</fpage>
          <lpage>76</lpage>
          <pub-id pub-id-type="doi">10.1097/01.PRS.0000070727.02992.54</pub-id>
          <pub-id pub-id-type="medline">12900604</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Siggelkow</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Klosterhalfen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Klinge</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Rath</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Faridi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Analysis of local complications following explantation of silicone breast implants</article-title>
          <source>Breast</source>
          <year>2004</year>
          <month>04</month>
          <volume>13</volume>
          <issue>2</issue>
          <fpage>122</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1016/j.breast.2003.08.003</pub-id>
          <pub-id pub-id-type="medline">15019692</pub-id>
          <pub-id pub-id-type="pii">S0960977603001887</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>NR</given-names>
            </name>
            <name name-style="western">
              <surname>Shadick</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Pereira</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Buring</surname>
              <given-names>JE</given-names>
            </name>
          </person-group>
          <article-title>Prospective cohort study of breast implants and the risk of connective-tissue diseases</article-title>
          <source>Int J Epidemiol</source>
          <year>2011</year>
          <month>02</month>
          <volume>40</volume>
          <issue>1</issue>
          <fpage>230</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/20943932"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/ije/dyq164</pub-id>
          <pub-id pub-id-type="medline">20943932</pub-id>
          <pub-id pub-id-type="pii">dyq164</pub-id>
          <pub-id pub-id-type="pmcid">PMC3043280</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Israel</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Afifi</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Breast implant illness: symptoms, patient concerns, and the power of social media</article-title>
          <source>Plast Reconstr Surg</source>
          <year>2017</year>
          <month>11</month>
          <volume>140</volume>
          <issue>5</issue>
          <fpage>765</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1097/PRS.0000000000003785</pub-id>
          <pub-id pub-id-type="medline">28753149</pub-id>
          <pub-id pub-id-type="pii">00006534-201711000-00061</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Israel</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Poore</surname>
              <given-names>SO</given-names>
            </name>
            <name name-style="western">
              <surname>Afifi</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Facebook facts: breast reconstruction patient-reported outcomes using social media</article-title>
          <source>Plast Reconstr Surg</source>
          <year>2018</year>
          <month>05</month>
          <volume>141</volume>
          <issue>5</issue>
          <fpage>1106</fpage>
          <lpage>13</lpage>
          <pub-id pub-id-type="doi">10.1097/PRS.0000000000004275</pub-id>
          <pub-id pub-id-type="medline">29697604</pub-id>
          <pub-id pub-id-type="pii">00006534-201805000-00007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Magnusson</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Cooter</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Rakhorst</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>McGuire</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>WP</given-names>
            </name>
            <name name-style="western">
              <surname>Deva</surname>
              <given-names>AK</given-names>
            </name>
          </person-group>
          <article-title>Breast implant illness: a way forward</article-title>
          <source>Plast Reconstr Surg</source>
          <year>2019</year>
          <month>03</month>
          <volume>143</volume>
          <issue>3S</issue>
          <fpage>74</fpage>
          <lpage>81</lpage>
          <pub-id pub-id-type="doi">10.1097/PRS.0000000000005573</pub-id>
          <pub-id pub-id-type="medline">30817559</pub-id>
          <pub-id pub-id-type="pii">00006534-201903001-00012</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adidharma</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Latack</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Colohan</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Morrison</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Cederna</surname>
              <given-names>PS</given-names>
            </name>
          </person-group>
          <article-title>Breast implant illness: are social media and the internet worrying patients sick?</article-title>
          <source>Plast Reconstr Surg</source>
          <year>2020</year>
          <month>01</month>
          <volume>145</volume>
          <issue>1</issue>
          <fpage>225</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1097/PRS.0000000000006361</pub-id>
          <pub-id pub-id-type="medline">31625990</pub-id>
          <pub-id pub-id-type="pii">00006534-202001000-00096</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Keane</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ha</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Myckatyn</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>En bloc capsulectomy for breast implant illness: a social media phenomenon?</article-title>
          <source>Aesthet Surg J</source>
          <year>2021</year>
          <volume>41</volume>
          <issue>4</issue>
          <fpage>448</fpage>
          <lpage>59</lpage>
          <pub-id pub-id-type="doi">10.1093/asj/sjaa203</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wee</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Younis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Isbester</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wangler</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Sarode</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Patil</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Grunzweig</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Boas</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Harvey</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Understanding breast implant illness, before and after explantation: a patient-reported outcomes study</article-title>
          <source>Ann Plast Surg</source>
          <year>2020</year>
          <month>07</month>
          <volume>85</volume>
          <issue>S1 Suppl 1</issue>
          <fpage>82</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32530850"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/SAP.0000000000002446</pub-id>
          <pub-id pub-id-type="medline">32530850</pub-id>
          <pub-id pub-id-type="pii">00000637-202007001-00019</pub-id>
          <pub-id pub-id-type="pmcid">PMC7294749</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ponraja</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>McLeod</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chong</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Breast implant illness: a biofilm hypothesis</article-title>
          <source>Plast Reconstr Surg Glob Open</source>
          <year>2020</year>
          <month>04</month>
          <volume>8</volume>
          <issue>4</issue>
          <fpage>e2755</fpage>
          <pub-id pub-id-type="doi">10.1097/GOX.0000000000002755</pub-id>
          <pub-id pub-id-type="medline">32440423</pub-id>
          <pub-id pub-id-type="pmcid">PMC7209857</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="web">
          <source>Blog - Cancer.net</source>
          <access-date>2021-01-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cancer.net/blog">https://www.cancer.net/blog</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="web">
          <source>Blog - Living Beyond Breast Cancer</source>
          <access-date>2021-01-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.lbbc.org/blog">https://www.lbbc.org/blog</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="web">
          <article-title>Stories from patients with breast, lung and other cancers</article-title>
          <source>Cancer Treatment Centers of America</source>
          <access-date>2021-01-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cancercenter.com/patient-stories">https://www.cancercenter.com/patient-stories</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="web">
          <article-title>Chronic illness</article-title>
          <source>Mighty Well Archives</source>
          <access-date>2021-01-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://blog.mighty-well.com/category/chronic-illness/">https://blog.mighty-well.com/category/chronic-illness/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="web">
          <article-title>Practical pain management - symptoms, causes, treatments, medications for chronic pain</article-title>
          <source>Remedy Health Media, LLC</source>
          <access-date>2021-01-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.practicalpainmanagement.com/patients">https://www.practicalpainmanagement.com/patients</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="web">
          <article-title>Resources: for patients</article-title>
          <source>Body Politic</source>
          <access-date>2021-01-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.wearebodypolitic.com/resources">https://www.wearebodypolitic.com/resources</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="web">
          <article-title>Coronavirus blog team</article-title>
          <source>Medium</source>
          <access-date>2021-01-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medium.com/@coronavirus_blog_team">https://medium.com/@coronavirus_blog_team</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="web">
          <article-title>COVID-19 patient stories</article-title>
          <source>Johns Hopkins Medicine</source>
          <access-date>2021-01-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.hopkinsmedicine.org/coronavirus/patient-stories/">https://www.hopkinsmedicine.org/coronavirus/patient-stories/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="web">
          <article-title>About breast implant illness</article-title>
          <source>Breast Implant Illness</source>
          <access-date>2019-05-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.breastimplantillness.com/symptoms/">https://www.breastimplantillness.com/symptoms/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="web">
          <article-title>Breast implant illness - symptoms, explant, surgeons, detox</article-title>
          <source>Healing Breast Implant Illness</source>
          <access-date>2019-05-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://healingbreastimplantillness.com">https://healingbreastimplantillness.com</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="web">
          <article-title>#breastimplantillness hashtag on Instagram</article-title>
          <source>Instagram</source>
          <access-date>2019-09-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.instagram.com/explore/tags/breastimplantillness">https://www.instagram.com/explore/tags/breastimplantillness</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>GK</given-names>
            </name>
            <name name-style="western">
              <surname>Masanz</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ogren</surname>
              <given-names>PV</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kipper-Schuler</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Chute</surname>
              <given-names>CG</given-names>
            </name>
          </person-group>
          <article-title>Mayo clinical Text Analysis and Knowledge Extraction System (cTAKES): architecture, component evaluation and applications</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2010</year>
          <volume>17</volume>
          <issue>5</issue>
          <fpage>507</fpage>
          <lpage>13</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/lookup/pmidlookup?view=long&#38;pmid=20819853"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/jamia.2009.001560</pub-id>
          <pub-id pub-id-type="medline">20819853</pub-id>
          <pub-id pub-id-type="pii">17/5/507</pub-id>
          <pub-id pub-id-type="pmcid">PMC2995668</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bodenreider</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>The Unified Medical Language System (UMLS): integrating biomedical terminology</article-title>
          <source>Nucleic Acids Res</source>
          <year>2004</year>
          <month>01</month>
          <day>1</day>
          <volume>32</volume>
          <issue>Database issue</issue>
          <fpage>267</fpage>
          <lpage>70</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://nar.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=14681409"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkh061</pub-id>
          <pub-id pub-id-type="medline">14681409</pub-id>
          <pub-id pub-id-type="pii">32/suppl_1/D267</pub-id>
          <pub-id pub-id-type="pmcid">PMC308795</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>MI</given-names>
            </name>
          </person-group>
          <article-title>Latent Dirichlet allocation</article-title>
          <source>J Mach Learn Res</source>
          <year>2003</year>
          <volume>3</volume>
          <fpage>993</fpage>
          <lpage>1022</lpage>
          <pub-id pub-id-type="doi">10.5555/944919.944937</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Loper</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bird</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>NLTK: the Natural Language Toolkit</article-title>
          <source>Proceedings of the ACL-02 Workshop on Effective Tools and Methodologies for Teaching Natural Language Processing and Computational Linguistics</source>
          <year>2002</year>
          <conf-name>ACL-02 Workshop on Effective Tools and Methodologies for Teaching Natural Language Processing and Computational Linguistics</conf-name>
          <conf-date>July 7, 2002</conf-date>
          <conf-loc>Philadelphia, Pennsylvania</conf-loc>
          <publisher-loc>USA</publisher-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>63</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.3115/1118108.1118117</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>C implementation of variational EM for latent Dirichlet allocation (LDA)</article-title>
          <source>GitHub</source>
          <year>2013</year>
          <access-date>2019-07-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/blei-lab/lda-c">https://github.com/blei-lab/lda-c</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hofmann</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Probabilistic latent semantic indexing</article-title>
          <source>Proceedings of the 22nd Annual International ACM SIGIR Conference on Research and Development in Information Retrieval</source>
          <year>1999</year>
          <conf-name>SIGIR99: 22nd Annual International ACM SIGIR Conference on Research and Development in Information Retrieval</conf-name>
          <conf-date>August 15-19, 1999</conf-date>
          <conf-loc>Berkeley, California, USA</conf-loc>
          <publisher-loc>United States</publisher-loc>
          <publisher-name>Association for Computing Machinery</publisher-name>
          <fpage>50</fpage>
          <lpage>57</lpage>
          <pub-id pub-id-type="doi">10.1145/312624.312649</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lafferty</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Correlated topic models</article-title>
          <source>Proceedings of the Advances in Neural Information Processing Systems</source>
          <year>2006</year>
          <conf-name>Advances in Neural Information Processing Systems</conf-name>
          <conf-date>December 4-7, 2006</conf-date>
          <conf-loc>Vancouver, Canada</conf-loc>
          <publisher-loc>Cambridge, United States</publisher-loc>
          <publisher-name>MIT Press</publisher-name>
          <pub-id pub-id-type="doi">10.5555/2976248.2976267</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Boyd-Graber</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gerrish</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Reading tea leaves: how humans interpret topic models</article-title>
          <source>Proceedings of the Advances in Neural Information Processing Systems</source>
          <year>2009</year>
          <conf-name>Advances in Neural Information Processing Systems</conf-name>
          <conf-date>December 2009</conf-date>
          <conf-loc>Vancouver, Canada</conf-loc>
          <publisher-loc>United States</publisher-loc>
          <publisher-name>Curran Associates Inc</publisher-name>
          <pub-id pub-id-type="doi">10.5555/2984093.2984126</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
