<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v13i1e70940</article-id>
      <article-id pub-id-type="pmid">40939164</article-id>
      <article-id pub-id-type="doi">10.2196/70940</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Extracting Symptoms of Complex Conditions From Online Discourse (Subreddit to Symptomatology): Lexicon-Based Approach</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Castonguay</surname>
            <given-names>Alexandre</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Hwang</surname>
            <given-names>Sy</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Sauvayre</surname>
            <given-names>Romy</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Sivarajkumar</surname>
            <given-names>Sonish</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Hossain</surname>
            <given-names>Bushra</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0006-0941-0374</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Preum</surname>
            <given-names>Sarah M</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7771-8323</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Rabbi</surname>
            <given-names>Md Fazle</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0004-1628-4519</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Ara</surname>
            <given-names>Rifat</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0007-4191-5492</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Ali</surname>
            <given-names>Mohammed Eunus</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <address>
            <institution/>
            <institution>Faculty of Information Technology</institution>
            <institution>Monash University</institution>
            <addr-line>20 Exhibition Walk (Woodside Building)</addr-line>
            <addr-line>Clayton, VIC 3168</addr-line>
            <country>Australia</country>
            <phone>61 3 9905 1741</phone>
            <email>eunus.ali@monash.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0384-7616</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Computer Science and Engineering</institution>
        <institution>Bangladesh University of Engineering and Technology</institution>
        <addr-line>Dhaka</addr-line>
        <country>Bangladesh</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Computer Science</institution>
        <institution>Dartmouth College</institution>
        <addr-line>Hanover, NH</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Biomedical Data Science</institution>
        <institution>Geisel School of Medicine</institution>
        <addr-line>Hanover, NH</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Computer Science and Engineering</institution>
        <institution>Bangladesh University of Professionals</institution>
        <addr-line>Dhaka</addr-line>
        <country>Bangladesh</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Obstetrics &#38; Gynecology</institution>
        <institution>Bangladesh College of Physicians and Surgeons</institution>
        <addr-line>Dhaka</addr-line>
        <country>Bangladesh</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Faculty of Information Technology</institution>
        <institution>Monash University</institution>
        <addr-line>Clayton</addr-line>
        <country>Australia</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Mohammed Eunus Ali <email>eunus.ali@monash.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>12</day>
        <month>9</month>
        <year>2025</year>
      </pub-date>
      <volume>13</volume>
      <elocation-id>e70940</elocation-id>
      <history>
        <date date-type="received">
          <day>6</day>
          <month>1</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>26</day>
          <month>4</month>
          <year>2025</year>
        </date>
        <date date-type="rev-recd">
          <day>25</day>
          <month>5</month>
          <year>2025</year>
        </date>
        <date date-type="accepted">
          <day>9</day>
          <month>7</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©Bushra Hossain, Sarah M Preum, Md Fazle Rabbi, Rifat Ara, Mohammed Eunus Ali. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 12.09.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2025/1/e70940" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Millions of people affected with complex medical conditions with diverse symptoms often turn to online discourse to share their experiences. While some studies have explored natural language processing methods and medical information extraction tools, these typically focus on generic symptoms in clinical notes and struggle to identify patient-reported, disease-specific, subtle symptoms from online health discourse.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We aimed to extract patient-reported, disease-specific symptoms shared on social media reflecting the lived experiences of thousands of affected individuals and explore the characteristics, prevalence, and occurrence patterns of the symptoms.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We propose a lexicon-based symptom extraction (LSE) method to identify a diverse list of disease-specific, patient-reported symptoms. We initially used a large language model to accelerate the extraction of symptom-related key phrases that formed the lexicon. We evaluated the effectiveness of lexicon extraction against human annotation using a Jaccard index score. We then leveraged BERT-Base, BioBERT, and Phrase-BERT–based embeddings to learn representations of these symptom-related key phrases and cluster similar symptoms using k-means and hierarchical density-based spatial clustering of applications with noise (HDBSCAN). Among the different options explored in our experiments, BioBERT-based k-means clustering was found to be the most effective. Finally, we applied symptom normalization to eliminate duplicate and redundant entries in the comprehensive symptom list.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>In a real-world polycystic ovary syndrome (PCOS) subreddit dataset, we found that LSE significantly outperformed state-of-the-art baselines, achieving at least 41% and 20% higher <italic>F</italic><sub>1</sub>-scores (mean 86.10) than automatic medical extraction tools and large language models, respectively. Notably, the comprehensive list of 64 PCOS symptoms generated via LSE ensured extensive coverage of symptoms reported in 7 reputable eHealth forums. Analyzing PCOS symptomatology revealed 28 potentially emerging symptoms and 8 self-reported comorbidities co-occurring with PCOS.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The comprehensive patient-reported, disease-specific symptom list can help patients and health practitioners resolve uncertainties surrounding the disease, eliminating the variability of PCOS symptoms prevailing in the community. Analyzing PCOS symptomatology across varied dimensions provides valuable insights for public health research.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>complex medical condition</kwd>
        <kwd>polycystic ovary syndrome</kwd>
        <kwd>online discourse</kwd>
        <kwd>large language models</kwd>
        <kwd>natural language processing</kwd>
        <kwd>disease-specific symptoms</kwd>
        <kwd>health information extraction</kwd>
        <kwd>symptomatology</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>The rise of health 2.0 has significantly increased the consumption of health-related information on social media in recent years. Worldwide, 34.7% of adult internet users frequently search for health-related information online, with approximately 58.5% of adults in the United States specifically engaging in such searches as of 2023 [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Analyzing online discourse on health-related topics offers valuable insights into the lived experiences and perspectives of affected individuals [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref5">5</xref>]. The critical findings of these analyses are particularly significant for understanding complex medical conditions, such as different types of cancer, cognitive and mental health conditions, autoimmune disorders, and metabolic and endocrinological conditions. These medical conditions often manifest with diverse symptoms that vary significantly among patients [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. Furthermore, there is often no consensus among established medical sources regarding the full range of possible symptoms for such conditions [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. This variability poses challenges for patients, health care providers, and researchers seeking a comprehensive understanding of these symptoms and their characteristics. Thus, the study and analysis of symptoms associated with a disease, referred to as <italic>symptomatology</italic>, is crucial for understanding complex diseases [<xref ref-type="bibr" rid="ref11">11</xref>]. We argue that a robust approach to extracting disease-specific symptoms from individuals’ lived experiences shared on social media can address uncertainties surrounding complex medical conditions. This approach would also allow for the identification of symptoms that patients associate with a condition (eg, brain fog with post–COVID-19 condition), prevalence of symptom co-occurrence (eg, unexplained weight loss and pain with cancer), and how symptoms vary based on patients’ comorbidities and preexisting conditions.</p>
        <p>Recent advancements in natural language processing (NLP) have enabled public health researchers to explore medical information extraction tools [<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref15">15</xref>] and develop novel techniques [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref18">18</xref>] for analyzing online health discourse, including patient-reported data from social media. However, off-the-shelf medical information extraction tools primarily excel in extracting well-known medical entities (eg, diseases, drugs, and basic symptoms). Their limitations become evident with granular, patient-centric details (eg, unusual symptom descriptions, implicit context, or subtle adverse events), which often require specialized rules or retrained models for accurate detection [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref22">22</xref>]. Modern transformer-based models used with medical named entity recognition have shown promising results in symptom extraction [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. However, these models typically require large amounts of domain-specific data and are mostly trained on clinical notes (electronic health records), which limits their effectiveness when dealing with colloquial health discourse generated by patients [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref25">25</xref>]. A family of bidirectional encoder representations from transformers (BERT)–based models fine-tuned on colloquial data markedly improves symptom recognition in informal texts; nevertheless, their error analysis indicates that the best-trained models still capture only approximately 25% to 50% of lengthy, figurative symptom phrases and continue to misclassify many subtle or previously unseen expressions (eg, “mild difficulty taking deep breaths” or “chest again felt a little tight”) [<xref ref-type="bibr" rid="ref26">26</xref>]. A recent NLP pipeline [<xref ref-type="bibr" rid="ref27">27</xref>] used to extract symptoms from patient narratives on social media proposed a dual-corpus symptom lexicon containing keywords (eg, <italic>fever</italic> and <italic>cough</italic>) and related modifiers (eg, <italic>mild</italic> or <italic>severe</italic>) followed by applying a rule-based postprocessing step to merge the 2. However, this fixed rule-based approach may struggle to report symptoms whenever people describe them implicitly, with spelling noise, or in new phrasing that never entered the seed lists (eg, “can’t breathe properly” or “my lungs felt on fire”).</p>
        <p>While the existing lexicon-based approaches have successfully used predefined resources and deep learning frameworks for broad public health surveillance, their reliance on explicit wording limits their ability to capture the full range of informal expressions. On the other hand, large language models (LLMs) have significantly accelerated medical NLP research, especially in the field of information extraction [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. While some studies have demonstrated the potential of LLMs for health information extraction from social media [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>], they face challenges when extracting specific contexts such as health advice and disease-specific treatment [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref16">16</xref>].</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>To overcome the aforementioned limitations of symptom extraction from social media discourse, we propose a novel NLP pipeline that systematically combines the capabilities of LLMs and other NLP methods with feedback from domain experts, resulting in a scalable and practical solution to the problem of symptom extraction from patient-reported social media discourse.</p>
        <p>While the proposed pipeline can be applied to explore a plethora of medical conditions for which there is an abundance of patient-reported online discourse, we focused on a common chronic condition with significant uncertainty, namely, polycystic ovary syndrome (PCOS), as a use case in this paper. According to the World Health Organization [<xref ref-type="bibr" rid="ref31">31</xref>], an estimated 116 million women (3.4% of reproductive-age women) worldwide are affected by PCOS, and its prevalence is on the rise. Despite its widespread impact, the full spectrum of PCOS remains insufficiently explored [<xref ref-type="bibr" rid="ref32">32</xref>]. Patients report a diverse range of symptoms that vary in severity depending on previous medical history and their effect on daily life. The combination of varied symptoms, insufficient treatment guidelines, and instances of medical gaslighting often leads to psychological distress, prompting many individuals to seek support and share experiences on social media platforms [<xref ref-type="bibr" rid="ref33">33</xref>], including Reddit. Existing research leveraging social media data to study PCOS is still underdeveloped [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref34">34</xref>-<xref ref-type="bibr" rid="ref36">36</xref>]. This creates a unique opportunity to systematically identify self-reported symptoms and related symptomatology based on the lived experiences of thousands of individuals and, thereby, inform the clinical understanding of this complex medical condition. We make 3 primary contributions. First, we developed a novel lexicon-based symptom extraction (LSE) method to identify diverse disease-specific symptoms from individuals’ experiences shared on social media. This method can effectively detect even subtle symptoms mentioned in user discourse. We applied our LSE method to a novel PCOS subreddit dataset, achieving statistically significant improvements over state-of-the-art medical NLP baselines.</p>
        <p>Second, we conducted an in-depth analysis of peer discussion threads on the extracted PCOS symptoms to reveal a set of lesser-known yet prevalent symptoms that individuals associate with PCOS and associated co-occurring symptoms and comorbidities. These findings can contribute to clinical research and public health research in a community-informed way.</p>
        <p>Third, we curated a novel Reddit dataset containing 59,962 and 641,441 relevant posts and comments, respectively. This dataset captures self-reported PCOS symptoms and their context from 68,010 affected individuals. In addition, we curated a human-annotated, labeled dataset of 1000 posts of patient-reported symptoms related to PCOS based on guidance from domain experts and patient input. We release these resources in a public domain. These unique, rich resources can enable medical NLP and computational health researchers to further investigate the symptomatology of complex medical conditions identified and analyzed online.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Collection and Preprocessing</title>
        <p>We selected Reddit as a source of data because of its anonymous nature. It encourages users to share personal experiences on stigmatized topics [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. The data collection process began with the identification of the r/PCOS subreddit by considering the group posts’ availability and popularity among 153,000 members engaging in discussions on PCOS. We systematically collected data from this subreddit using the <italic>Python Reddit API Wrapper</italic> package (Python Software Foundation) and the Pushshift application programming interface (API) [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>]. We obtained all the posts and comments from the r/PCOS subreddit from August 4, 2010, to December 31, 2022. This timeline was chosen to ensure a comprehensive capture of recent as well as previous discussions. For each post, we retained the date, flair name, unique post ID, post title, post content, score, upvotes, and comments due to their utility and relevance.</p>
        <p>During preprocessing, we discarded entries with deleted posts or those in which the post content had &#60;5 words as the brevity poses challenges to deriving meaningful insights from posts. We also removed posts containing irrelevant text (eg, polls, survey links only, or URLs). The URL-heavy posts were classified using a rule-based heuristic combining personal pronoun frequency and URL-to-text ratio. We provide a summary of the steps to remove irrelevant text from social media data in Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. This filtering process enabled us to focus on patient-authored, experience-rich discussions. Finally, we obtained a primary dataset comprising 59,962 posts and 641,441 comments by 68,010 active unique users. Identifying task-relevant data is crucial for data-driven approaches [<xref ref-type="bibr" rid="ref12">12</xref>] as it significantly impacts the efficiency of downstream tasks. We leveraged Reddit’s post “flair” option to filter relevant data. On Reddit, a post flair is a customizable text or icon that appears next to a post title to provide additional context or categorization, similar to hashtags available on other platforms. We reviewed 30 randomly selected posts from several flairs of the PCOS subreddit. We identified that, among all the flairs, posts in the “General/Advice” flair were more likely to share knowledge and seek advice on symptoms. Further investigation on the most frequent unigrams of these flairs supported our qualitative analysis, where the presence of symptom-related unigrams such as “period,” “symptom,” “doctor,” “birth,” “control,” and “diagnosed” was predominantly observed in the “General/Advice” flair. The distribution of frequent unigrams in the “General/Advice” flair is shown in Figure S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. On the basis of these findings, we chose the “General/Advice” flair for extracting a wide range of symptoms. In addition, the “General/Advice” flair is more popular in the community as it contains the highest number of posts, as shown in Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. This selection ensured a broad range of symptoms and valuable insights. Finally, we developed a corpus of 10,500 posts for the symptom identification task, randomly selected from the posts with the “General/Advice” flair.</p>
      </sec>
      <sec>
        <title>Our Method: LSE</title>
        <p>We propose an LSE method to analyze self-reported symptoms of a complex medical condition using social media discourse. Our proposed method consists of three main steps: (1) symptom-related lexicon extraction, (2) symptom identification, and (3) symptom normalization, as illustrated in <xref rid="figure1" ref-type="fig">Figure 1</xref>.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Steps of the lexicon-based symptom extraction method. JI: Jaccard index; LLM: large language model.</p>
          </caption>
          <graphic xlink:href="medinform_v13i1e70940_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <sec>
          <title>Symptom-Related Lexicon Extraction</title>
          <p>We leveraged symptom-related key phrases for lexicon extraction as it helped distill the most relevant terms and phrases associated with physical manifestations from user narratives. We focused on extracting the key symptom-related phrases instead of the symptoms as the latter results in extracting (1) phrases that are not relevant and (2) repetitive mentions of the same symptoms, rendering the subsequent analysis challenging. Compared to the tedious and time-intensive task of manual extraction, LLMs emerge as a more economical choice, offering consistency in their responses, especially when the temperature setting is near 0 [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>]. We used the OpenAI API <italic>gpt-3.5-turbo-16k</italic> [<xref ref-type="bibr" rid="ref42">42</xref>] to annotate 10,500 user posts. To ensure precision in identifying the physical manifestation of the condition, we emphasized physical symptoms while excluding psychological aspects in our base prompt using a zero-shot prompting strategy (Figure S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The API responses were stored in a JSON line format containing key phrases and corresponding posts. This process yielded a lexicon of 30,370 symptom-related key phrases that we used in the subsequent steps.</p>
          <p>We resorted to human annotation to validate the extraction conducted by ChatGPT (OpenAI). We employed 2 graduate students in the science, technology, engineering, and mathematics field particularly active in women’s health–related social media forums. Before annotation, they underwent multiple training sessions led by a domain expert specializing in computational health. These sessions were designed to refine their understanding on key phrase extraction and promote annotation consistency. On a sample set of 30 posts, the interannotator agreement reached 92% in a relaxed match. Finally, we randomly selected 500 entries from 10,500 user posts. We recognize that many social media and health NLP studies use larger annotated sets, often containing 2000 to 4000 messages, and few drop below 1000 annotations [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref43">43</xref>-<xref ref-type="bibr" rid="ref45">45</xref>]. However, those datasets are typically used to validate end-to-end model performance, whereas our 500-post sample supported a specific component of our pipeline. We deliberately divided tasks between the LLM and human experts to balance coverage and precision while remaining practical as (1) the cost in terms of time and resources was significant (eg, annotating just 500 entries required 4 training sessions × 3 hours = 12 hours, 35 hours for literature study and documentation, and 208.3 hours approximately for annotation per post; 500 posts × 25 minutes), making larger samples prohibitively expensive; (2) we observed a significant drop in new symptom-related key phrase discoveries after the first 200 posts, mirroring the classic “diminishing returns” shown in Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, also evident in social media symptom mining and related tasks [<xref ref-type="bibr" rid="ref46">46</xref>]; and (3) during manual inspection, we observed minimal disagreement as the annotation task was primarily syntactic rather than interpretive. Taking into consideration the above 3 points, we assigned 250 unique posts to each annotator to minimize bias and enhance the quality of our annotated set.</p>
          <p>We choose the Jaccard index (JI) to measure the similarity between key phrases extracted by ChatGPT and the human annotators [<xref ref-type="bibr" rid="ref12">12</xref>]. This required normalizing the extracted key phrases (eg, changing “pressure in pelvic area” to “pelvic pressure”) to maintain homogeneity in both lists. We computed the JI similarity for each post in the sample using exact key phrase match. <xref ref-type="table" rid="table1">Table 1</xref> shows 3 posts from our sample set with extracted key phrases and their corresponding JI scores. The average JI score was 74%, indicating moderate lexical similarity between the key phrases extracted by ChatGPT and the human annotators considering the complexity of the task [<xref ref-type="bibr" rid="ref47">47</xref>]. Our manual investigation of all missed or incorrectly extracted key phrases by the LLM revealed 5 distinct error categories, as outlined in Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. For instance, in row 1 of <xref ref-type="table" rid="table1">Table 1</xref>, the LLM missed “absence of period” as it was implicitly mentioned in the post as “haven’t had a period since December.” Similarly, in row 3, “insulin resistance” is an ambiguous expression to be accepted as a symptom. However, a deeper analysis revealed 3 findings supporting the acceptability of the lexicon.</p>
          <p>First, post-level JI analysis; our manual investigation showed that 12.6% (63/500) of the posts had a JI score of 0, which substantially affected the average JI. We found that most of these JIs with a value of 0 resulted from very short posts (eg, “Does anyone know if weightloss in PCOS helps or throws off hormones?”) and were annotated as <italic>no symptom</italic> by humans, whereas the LLM incorrectly extracted the key phrases <italic>weightloss</italic> and <italic>hormones</italic>. The median JI score across all posts was 1.0 (IQR 0.5-1.0), indicating strong agreement between the LLM and human annotations in most cases.</p>
          <p>Second, lexicon-level robustness; we observed that the LLM missed a key phrase in a post, resulting in a mismatch, but extracted the same key phrase in another post. Similar cases were found for human annotation, resulting in incorrect extraction for the LLM. We identified such cases for 61% (104/172) of the total missed or incorrectly extracted key phrases, which affected the average JI. As the final lexicon aggregates key phrases across all posts, these disagreements at the post level did not propagate to the lexicon level. When comparing the LLM-derived lexicon with the human-annotated lexicon, we observed a JI of 0.89, demonstrating strong alignment between the 2. This high agreement confirmed that discrepancies in per-post extraction had minimal impact on the final lexicon’s accuracy and coverage.</p>
          <p>Third, downstream impact on symptom list; the frequency of unique incorrectly extracted key phrases in the lexicon was very low (maximum of 3). Consequently, their influence on the cluster centroids was negligible. Because our symptom list was derived by selecting the most frequent phrases within each cluster, the effect of noisy or rare phrases was minimized. Such key phrases either formed microclusters (eg, <italic>ultrasound</italic>) that were discarded during the normalization step or were absorbed into broader, validated symptom cluster categories.</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Sample excerpts of human and ChatGPT annotations of posts. The Jaccard index (JI) was calculated for the similarity between the 2 annotations based on the extracted key phrases.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="500"/>
              <col width="200"/>
              <col width="200"/>
              <col width="100"/>
              <thead>
                <tr valign="top">
                  <td>Post</td>
                  <td>Human annotation</td>
                  <td>ChatGPT annotation</td>
                  <td>JI score</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>“I haven’t had a period since December, however in the past week I keep getting really bad cramping with sharp pains (almost feels like my ovaries), but no period...has anyone else experienced this? Is this normal?”</td>
                  <td>“Absence of period,” “cramping,” and “sharp pains”</td>
                  <td>“Cramping” and “sharp pains”</td>
                  <td>0.67</td>
                </tr>
                <tr valign="top">
                  <td>“I’m 22, F and over the years, I have gained 50 pounds. Recently, my acne is getting worse and I feel pressure in my pelvic area. I am trying to lose weight and thereby started working out but the scale is still not budging.”</td>
                  <td>“Weight gain,” “acne,” and “pelvic pressure”</td>
                  <td>“Weight gain,” “acne,” and “pelvic pressure”</td>
                  <td>1.0</td>
                </tr>
                <tr valign="top">
                  <td>“Due to PCOS and insulin resistance, Does anyone else get symptoms like they’re getting their period (sore breasts, crampy feeling) and just overall malaise when you’re ‘due’ for your period you don’t actually get?”</td>
                  <td>“Insulin resistance,” “sore breasts,” and “crampy feeling”</td>
                  <td>“Sore breasts,” “crampy feeling,” and “malaise”</td>
                  <td>0.5</td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
          <p>In summary, while there were post-level discrepancies, the high lexicon-level JI (0.89) and the robustness of frequency-based clustering ensured that the final symptom list remained accurate and representative of human annotation without prohibitive annotation burden.</p>
        </sec>
        <sec>
          <title>Symptom Identification</title>
          <sec>
            <title>Overview</title>
            <p>In this step, we identified a distinct set of disease symptoms using the symptom-related lexicon. As the key phrases in the lexicon were captured exactly as mentioned in users’ posts, many were semantically similar with different phrasing. For example, key phrases such as <italic>cystic ovary</italic>, <italic>ovarian cysts</italic>, and <italic>multiple cysts in ovaries</italic> have the same semantic meaning with different surface forms. Thus, we used clustering to categorize the semantically similar key phrases and identify such categories as unique symptoms. To ensure accurate clustering, it is crucial to generate meaningful representations of symptom-related key phrases that effectively capture their semantic meaning. To achieve this, we used embeddings, which convert words into numeric representations in lower dimensions that preserve their contexts. The process of embedding and clustering the key phrases is described in the following sections.</p>
          </sec>
          <sec>
            <title>Choosing the Right Embedding</title>
            <p>We explored and evaluated widely used transformer models such as BERT-Base [<xref ref-type="bibr" rid="ref48">48</xref>], Phrase-BERT [<xref ref-type="bibr" rid="ref49">49</xref>], and BioBERT [<xref ref-type="bibr" rid="ref50">50</xref>] to generate embeddings of symptom-related key phrases. We observed the performance of these embeddings by applying various clustering methods. For k-means clustering, we analyzed the silhouette score for each BERT-based embedding. The silhouette score considers both within-cluster and intercluster variances to determine cluster quality [<xref ref-type="bibr" rid="ref51">51</xref>]. We plotted silhouette scores of different embedding approaches, shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>A. The curves for BERT-Base and Phrase-BERT show a general increase but noticeable fluctuation, representing inconsistency in the results. In contrast, BioBERT shows a consistent and uniform ascent compared to the other 2 in the silhouette curve. Furthermore, applying L2 normalization during embedding improved the uniqueness of the clusters [<xref ref-type="bibr" rid="ref48">48</xref>]. The consistent superiority of BioBERT across all clustering approaches steered our decision to adopt BioBERT as our embedding method.</p>
            <fig id="figure2" position="float">
              <label>Figure 2</label>
              <caption>
                <p>Characteristic analysis of embedding methods for selecting optimal clustering methods—(A) silhouette score analysis of different embeddings on k-means and (B) rate of change in inertia (within-cluster sum of the squares) decreasing as the number of clusters increases. BERT: bidirectional encoder representations from transformers.</p>
              </caption>
              <graphic xlink:href="medinform_v13i1e70940_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
            </fig>
          </sec>
          <sec>
            <title>Selecting the Optimal Clustering Method</title>
            <p>We exploited k-means and hierarchical density-based spatial clustering of applications with noise (HDBSCAN) with BioBERT embeddings for clustering symptom-related key phrases. Comparing k-means and HDBSCAN is fairly tricky as their hyperparameters (number of clusters vs density thresholds) are fundamentally different. Although it is widely known that HDBSCAN performs better for noisy social media data as it filters out “low-density” points as noise, the choice of clustering method depends on the downstream task and the performance on specific data. In Table S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, we report the performance of HDBSCAN under a grid of <italic>min_cluster_size</italic> and <italic>min_samples</italic> settings with the observations of cluster numbers, density-based clustering validation (DBCV) score, and noise. The DBCV score measures how dense and well separated core clusters are in a density-based clustering method [<xref ref-type="bibr" rid="ref52">52</xref>]. Thus, HDBSCAN with lower <italic>minimum_cluster_size</italic> increases in DBCV scores indicates compactness of the clusters but may generate spurious microclusters. Manual observation shows that HDBSCAN with lower <italic>minimum_cluster_size</italic> provides better intracluster coherence but reduce intercluster separation and generate more semantically similar clusters, such as <italic>increased testosterone</italic> and <italic>elevated level of testosterone</italic>. In contrast, an increasing <italic>minimum_cluster_size</italic> results in lower DBCV scores. As a result, the number of clusters decreases, which may contribute to losing meaningful clusters by being too strict on cluster size. For such instances, elements of the <italic>cysts on ovaries</italic> cluster represents less coherence and semantic similarity in HDBSCAN compared to k-means shown in (<xref rid="figure3" ref-type="fig">Figure 3</xref>). In our use case, HDBSCAN labeled 31% to 56% of the points as noise across settings. This affected the downstream task as our goal was to maximize symptom coverage. On the other hand, k-means has no noise filtering, which ensures maximum coverage of symptoms. In addition, we implemented k-means using the cosine distance to improve the cluster uniqueness with fewer duplicates compared to using the Euclidean distance [<xref ref-type="bibr" rid="ref53">53</xref>].</p>
            <fig id="figure3" position="float">
              <label>Figure 3</label>
              <caption>
                <p>Comparison of elements within the cluster "cysts on ovaries" between 2 clustering methods: (A) k-means, containing semantically similar key phrases that are evenly distributed, and (B) hierarchical density-based spatial clustering of applications with noise, containing key phrases conflicting with the cluster name, highlighted in red, and showing more uneven distribution.</p>
              </caption>
              <graphic xlink:href="medinform_v13i1e70940_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
            </fig>
          </sec>
          <sec>
            <title>Sensitivity and Stability Analysis in Choosing the <italic>k</italic> Value</title>
            <p>We varied the number of clusters (<italic>k</italic>) to determine the optimal number based on the silhouette score (in <xref rid="figure2" ref-type="fig">Figure 2</xref>A) and rate of change in inertia (in <xref rid="figure2" ref-type="fig">Figure 2</xref>B). In our PCOS use case, we identified that, after <italic>k</italic>=100, the change in inertia became flat and the rate of increment in silhouette score was also negligible. Therefore, we set <italic>k</italic> to range from 10 to 100, and at <italic>k</italic>=96, we observed an optimal silhouette score. In addition, we explored a –10 to +10 window for <italic>k</italic>=96 to verify the sensitivity of the resulting clusters. Across <italic>k</italic>=86 to 106, the silhouette score remained within approximately –0.01 to +0.01 of its value at <italic>k</italic>=96, and the inertia curve showed minimal change, confirming that the choice of <italic>k</italic> sat in the middle of a stable region. In addition, we report the bootstrap stability results for 3 representative choices between <italic>k</italic>=86 and 96. All 3 settings yielded high median Adjusted Rand Index (ARI) values (≥0.75) and narrow 95% CIs, demonstrating that cluster assignments are largely consistent when up to 20% of the data are held out. We provide a summary of the sensitivity and stability analysis of the choice of <italic>k</italic> in k-means in Table S6 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
          </sec>
        </sec>
        <sec>
          <title>Symptom Normalization</title>
          <sec>
            <title>Overview</title>
            <p>Each of the obtained clusters represented a symptom as the elements of the clusters were semantically similar. We considered the most frequent element of the cluster as the key symptom. The justification for selecting the most frequent element as the key symptom was 2-fold. First, its occurrences were significantly higher than those of other elements within the cluster. For instance, occurrences of <italic>cysts on ovaries</italic> compared to other elements within the cluster in <xref rid="figure3" ref-type="fig">Figure 3</xref>A were negligible. Second, all elements within a cluster consistently pointed toward the same physical condition as the key symptom. In the k-means cluster in <xref rid="figure3" ref-type="fig">Figure 3</xref>A, all the cluster elements referred to ovarian cysts. However, there were repetitions of symptoms in the obtained list. Therefore, we conducted symptom normalization by applying semantic mapping and validation by experts, as outlined in the following sections.</p>
          </sec>
          <sec>
            <title>Applying Semantic Mapping</title>
            <p>We applied semantic mapping of clusters, a manual process that involves merging symptoms with similar meanings and concepts using Unified Medical Language System Metathesaurus synonyms to avoid repetition. Through progressive discussions with our medical specialist, we formalized 4 semantic mapping rules suitable for this task. For instance, <italic>irregular bleeding</italic>, <italic>irregular menstrual cycles</italic>, and <italic>irregular cycles</italic> were mapped to <italic>irregular periods</italic> using rule 1, “synonym merging.” Applying these rules, we consolidated 11 such mappings from the initial 96 PCOS symptoms to 68 unique symptoms. The complete rule set is provided in Table S7 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> to ensure reproducibility.</p>
          </sec>
          <sec>
            <title>Validation by an Expert</title>
            <p>We further refined the symptom list by validating the relevance of the lived experiences of patients to the disease. One of our coauthors, a gynecologist with &#62;10 years of experience in treating PCOS, conducted this validation step. The expert’s role was to discard symptoms that were not related to the disease and resolve ambiguities between similar symptoms. For instance, the medical specialist discarded 4 irrelevant symptoms—<italic>ultrasound</italic>, <italic>birth control</italic>, <italic>low-carb diet</italic>, and <italic>neck</italic>—by manually investigating the cluster elements, resulting in a comprehensive list of 64 unique PCOS symptoms.</p>
          </sec>
        </sec>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>We acknowledge that the research on symptom extraction from social media has multifaceted ethical concerns and requires careful attention to privacy, consent, and the responsible use of data and technology. The research was approved by Bangladesh University of Engineering and Technology's Institutional Review Board. Although Reddit is an anonymous platform, we ensured that no personally identifiable information was inadvertently revealed during data collection, analysis, or publication. All Reddit posts and comments cited as examples in this paper were paraphrased to protect user privacy. We also recognize that the demographic composition of Reddit users might not be fully representative of the broader population with PCOS, potentially limiting generalizability. Therefore, findings derived from Reddit discourse should be generalized cautiously to other populations or settings. In addition, we recognize that any biases in the dataset and the proposed model are unintentional. As the outcomes of this work are based on social media content, we emphasize the superiority of medical evidence–based facts in cases of conflict, particularly concerning direct clinical practice and medical diagnosis. We strongly encourage the use of the model for research and exploratory purposes, serving as a foundation for further developments in computational health research.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Test Data Curation and Ground Truth Annotation</title>
        <p>We initially separated 1000 sample posts of various lengths from our dataset for results evaluation. Considering the influence of post length on symptom identification, we categorized the posts into three groups: (1) short posts of &#60;100 words, (2) medium-length posts of between 100 and 300 words, and (3) long posts of &#62;300 words. Post length distribution in the dataset revealed that 45% (450/1000) of the posts belonged to the medium-length category (Table S8 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). To ensure a balance across all categories, we selected 500 posts from the medium-length category and 250 posts from each of the short and long post categories for curating test data.</p>
        <p>We recruited a medical graduate with domain knowledge and a patient with PCOS lived experience to perform annotation. Before annotation, both annotators participated in progressive training sessions and interactive discussions with medical specialists to refine their understanding and improve annotation consistency. During this phase, the medical specialist primarily identified 3 potential disagreements between the annotators. These observed disagreements were instances in which (1) the medical graduate often used clinical terminology (eg, “amenorrhea”) whereas the patient used informal language (eg, “no period for months”); (2) the patient included self-reported experiences (eg, “hypothyroidism”) that lacked clinical validation whereas the clinician strictly adhered to established PCOS diagnostic criteria; and (3) the medical graduate inferred implicit symptoms (eg, laboratory test results) from domain knowledge, which was lacking in the patient annotation. Given our goal to prioritize the capture of patient-experienced symptoms, medical specialists suggested resolving these discrepancies by (1) avoiding overly technical clinical terms unless they were explicitly mentioned, (2) retaining self-reported experiences unless they were clinically invalid, and (3) including implicit symptoms as long as they were related to PCOS. Following these guidelines, both annotators extracted symptoms independently. We adopted the combination of both annotators’ symptom lists per post to maximize coverage and ensure the consistency and reliability of the ground truth dataset.</p>
        <p>In our ground truth annotation, annotators were not restricted to predefined symptom lists. They identified any symptoms that they perceived as PCOS related, resulting in free-text labels. Moreover, each post included multiple symptoms, making the traditional Cohen κ not suitable. Instead, we evaluated interannotator agreement using relaxed-match <italic>F</italic><sub>1</sub>-score due to the generative nature of our annotation [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]. We used BioBERT-based semantic similarity with the medical graduate’s annotation as a reference. We achieved an <italic>F</italic><sub>1</sub>-score of 0.82, with a recall of 0.84 at a similarity threshold of 0.6, indicating substantial agreement considering the realistic complexity inherent in patient-derived, generative-nature symptom annotation.</p>
      </sec>
      <sec>
        <title>Symptom Comparison: LSE With eHealth Forums</title>
        <p>LSE resulted in a comprehensive list of 64 unique PCOS symptoms (<xref ref-type="table" rid="table2">Table 2</xref>) from 10,500 user posts. We also determined the unique users reporting each symptom in our primary dataset, with counts ranging from 31 to 16,001. This confirmed that LSE captures widely experienced symptoms, whereas less common symptoms are not ignored. In addition, this list provides a wide range of coverage as we cross-checked it with 7 evidence-based consumer health websites: the World Health Organization [<xref ref-type="bibr" rid="ref31">31</xref>]; the Mayo Clinic [<xref ref-type="bibr" rid="ref56">56</xref>]; WebMD [<xref ref-type="bibr" rid="ref57">57</xref>]; the <italic>International Classification of Diseases, 10th Revision</italic> [<xref ref-type="bibr" rid="ref58">58</xref>]; Johns Hopkins Medicine [<xref ref-type="bibr" rid="ref59">59</xref>]; the National Health Service [<xref ref-type="bibr" rid="ref60">60</xref>]; and the Centers for Disease Control and Prevention [<xref ref-type="bibr" rid="ref61">61</xref>]. All symptoms mentioned in these sources were included in our list except for 4: sleep apnea, high blood pressure, low progesterone, and dandruff. Upon examining the clusters, we found that these 4 symptoms were represented within their respective key clusters—<italic>insomnia</italic>, <italic>high cholesterol</italic>, <italic>low estrogen</italic>, and <italic>high DHEA</italic>—due to their close medical relevance. Furthermore, all the forums recognized the 10 most frequently reported symptoms in our dataset (Table S9 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). On the other hand, we identified 28 symptoms not acknowledged by any of the eHealth forums that we mention as potentially emerging symptoms in the Discussion section. Thus, our comprehensive symptom list reflects the diversity of self-reported PCOS lived experience symptoms and aligns closely with authoritative medical sources, helping standardize the variability in the symptom descriptions.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Comprehensive list of 64 polycystic ovary syndrome symptoms extracted via lexicon-based symptom extraction. The counts represent the number of unique users reporting each symptom across the primary dataset. The symptoms in italics represent potentially emerging symptoms.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="600"/>
            <col width="400"/>
            <thead>
              <tr valign="top">
                <td>Symptom</td>
                <td>Unique users reporting the symptom, n</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Hirsutism</td>
                <td>16,001</td>
              </tr>
              <tr valign="top">
                <td>Acne</td>
                <td>14,256</td>
              </tr>
              <tr valign="top">
                <td>Cysts on ovaries</td>
                <td>13,781</td>
              </tr>
              <tr valign="top">
                <td>Pain</td>
                <td>13,495</td>
              </tr>
              <tr valign="top">
                <td>Weight gain</td>
                <td>13,150</td>
              </tr>
              <tr valign="top">
                <td>Mood swings</td>
                <td>11,523</td>
              </tr>
              <tr valign="top">
                <td>Insulin resistance</td>
                <td>9859</td>
              </tr>
              <tr valign="top">
                <td>Irregular period</td>
                <td>9702</td>
              </tr>
              <tr valign="top">
                <td>Infertility</td>
                <td>7558</td>
              </tr>
              <tr valign="top">
                <td>Cramps</td>
                <td>7043</td>
              </tr>
              <tr valign="top">
                <td>Diabetes</td>
                <td>6690</td>
              </tr>
              <tr valign="top">
                <td>Spotting</td>
                <td>6469</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Hypothyroidism</italic>
                </td>
                <td>5366</td>
              </tr>
              <tr valign="top">
                <td>No period</td>
                <td>4846</td>
              </tr>
              <tr valign="top">
                <td>Anovulation</td>
                <td>4755</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Nausea</italic>
                </td>
                <td>4600</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Cravings</italic>
                </td>
                <td>4566</td>
              </tr>
              <tr valign="top">
                <td>Fatigue</td>
                <td>4342</td>
              </tr>
              <tr valign="top">
                <td>Bloating</td>
                <td>4048</td>
              </tr>
              <tr valign="top">
                <td>Headaches</td>
                <td>4028</td>
              </tr>
              <tr valign="top">
                <td>Heavy period</td>
                <td>3846</td>
              </tr>
              <tr valign="top">
                <td>Hair loss</td>
                <td>3517</td>
              </tr>
              <tr valign="top">
                <td>High testosterone</td>
                <td>2794</td>
              </tr>
              <tr valign="top">
                <td>Skin issues</td>
                <td>2695</td>
              </tr>
              <tr valign="top">
                <td>Hormone imbalance</td>
                <td>2648</td>
              </tr>
              <tr valign="top">
                <td>Inflammation</td>
                <td>2457</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Endometriosis</italic>
                </td>
                <td>2303</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>High DHEA</italic>
                  <sup>a</sup>
                </td>
                <td>2231</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Loss of appetite</italic>
                </td>
                <td>2013</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Painful periods</italic>
                </td>
                <td>1906</td>
              </tr>
              <tr valign="top">
                <td>Insomnia</td>
                <td>1513</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Dizziness</italic>
                </td>
                <td>1471</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Night sweats</italic>
                </td>
                <td>1457</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Stomach pain</italic>
                </td>
                <td>1374</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Blood clots</italic>
                </td>
                <td>1187</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Anemia</italic>
                </td>
                <td>1162</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Brain fog</italic>
                </td>
                <td>1158</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Vomiting</italic>
                </td>
                <td>1134</td>
              </tr>
              <tr valign="top">
                <td>High androgen</td>
                <td>1121</td>
              </tr>
              <tr valign="top">
                <td>Oily skin</td>
                <td>912</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Back pain</italic>
                </td>
                <td>843</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Digestive issues</italic>
                </td>
                <td>826</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Constipation</italic>
                </td>
                <td>813</td>
              </tr>
              <tr valign="top">
                <td>Pelvic pain</td>
                <td>742</td>
              </tr>
              <tr valign="top">
                <td>Belly fat</td>
                <td>731</td>
              </tr>
              <tr valign="top">
                <td>Acanthosis nigricans</td>
                <td>616</td>
              </tr>
              <tr valign="top">
                <td>High cholesterol</td>
                <td>613</td>
              </tr>
              <tr valign="top">
                <td>High insulin</td>
                <td>575</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Low libido</italic>
                </td>
                <td>575</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Abdominal pain</italic>
                </td>
                <td>564</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Ovary pain</italic>
                </td>
                <td>496</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Dry skin</italic>
                </td>
                <td>480</td>
              </tr>
              <tr valign="top">
                <td>High estrogen</td>
                <td>480</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Stretch marks</italic>
                </td>
                <td>439</td>
              </tr>
              <tr valign="top">
                <td>Low estrogen</td>
                <td>436</td>
              </tr>
              <tr valign="top">
                <td>Brown discharge</td>
                <td>426</td>
              </tr>
              <tr valign="top">
                <td>Skin tags</td>
                <td>399</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Breast tenderness</italic>
                </td>
                <td>376</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>High prolactin</italic>
                </td>
                <td>331</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Pain during sex</italic>
                </td>
                <td>261</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Frequent urination</italic>
                </td>
                <td>160</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Redness</italic>
                </td>
                <td>108</td>
              </tr>
              <tr valign="top">
                <td>
                  <italic>Weight loss</italic>
                </td>
                <td>45</td>
              </tr>
              <tr valign="top">
                <td>High LH<sup>b</sup> level</td>
                <td>31</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>DHEA: dehydroepiandrosterone.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>LH: luteinizing hormone.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Baseline Comparisons</title>
        <sec>
          <title>Overview</title>
          <p>We compared the performance of LSE with leading baselines, including 2 popular off-the-shelf models—Amazon Comprehend Medical (ACM) [<xref ref-type="bibr" rid="ref62">62</xref>] and Google Healthcare Natural Language API (GHNLP) [<xref ref-type="bibr" rid="ref63">63</xref>]—in their default configuration. In addition, we evaluated both open-source and closed-source LLMs, namely, Llama 3.1 (8B) and GPT-4o in a zero-shot, near-0 temperature (0.25) setting. We identified symptoms in each post of the test dataset using all the baselines for comparison with the ground truth. For LSE, we used GPT-4o to identify symptoms guided by the comprehensive symptom list obtained through our method. Therefore, it was not strictly zero-shot but, rather, a form of lexicon-guided prompting. The model’s task was to match symptoms in the text against the LSE-provided symptom lexicon. To ensure reproducibility, we included the LLM prompt templates used for the baseline comparisons (GPT-4o and Llama 3.1), shown in Figure S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, and LSE evaluation using GPT-4o, as detailed in Figure S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. We evaluated competitive models using standard performance metrics—precision, recall, and <italic>F</italic><sub>1</sub>-score. To measure the similarity between symptoms, we used BioBERT-based semantic similarity as it performs optimally with medical data. Given the nuanced nature of symptom expressions, we set the different semantic similarity thresholds at 0.4, 0.6, and 0.8 for match acceptance, and the corresponding performance results are reported in <xref ref-type="table" rid="table3">Table 3</xref>. Experimental results show that LSE outperformed all baselines significantly across all metrics at every threshold level. As expected, increasing the similarity threshold imposed stricter matching criteria, resulting in fewer accepted symptom matches. Consequently, the performance of all baseline models dropped significantly with higher thresholds. In contrast, the performance of LSE decreased only marginally, highlighting the stability and robustness of our framework. For all subsequent analyses in this study, we adopted a semantic similarity threshold of 0.6 as the default setting. Several additional useful insights from the results are discussed in the following sections.</p>
          <table-wrap position="float" id="table3">
            <label>Table 3</label>
            <caption>
              <p>Comparing lexicon-based symptom extraction (LSE) with off-the-shelf medical information extraction tools and large language models in terms of precision, recall, and F1-score across different post lengths.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="150"/>
              <col width="80"/>
              <col width="70"/>
              <col width="90"/>
              <col width="80"/>
              <col width="70"/>
              <col width="90"/>
              <col width="80"/>
              <col width="70"/>
              <col width="90"/>
              <col width="100"/>
              <thead>
                <tr valign="top">
                  <td colspan="2">Model</td>
                  <td colspan="10">Post length<break/>  <break/>  </td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="3">≤100 words</td>
                  <td colspan="3">&#62;100 to 300 words</td>
                  <td colspan="3">&#62;300 words</td>
                  <td>For all length, mean <italic>F</italic><sub>1</sub>-score</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>Precision</td>
                  <td>Recall</td>
                  <td><italic>F</italic><sub>1</sub>-score</td>
                  <td>Precision</td>
                  <td>Recall</td>
                  <td><italic>F</italic><sub>1</sub>-score</td>
                  <td>Precision</td>
                  <td>Recall</td>
                  <td><italic>F</italic><sub>1</sub>-score</td>
                  <td/>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="12">
                    <bold>Similarity threshold of 0.4</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ACM<sup>a</sup></td>
                  <td>55.27</td>
                  <td>79.85</td>
                  <td>61.21<sup>b</sup></td>
                  <td>39.28</td>
                  <td>89.50</td>
                  <td>51.30</td>
                  <td>31.77</td>
                  <td>91.21</td>
                  <td>45.36</td>
                  <td>52.30</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>GHNLP<sup>c</sup></td>
                  <td>59.96</td>
                  <td>63.41</td>
                  <td>58.69<sup>b</sup></td>
                  <td>49.39</td>
                  <td>65.79</td>
                  <td>51.76</td>
                  <td>45.29</td>
                  <td>68.30</td>
                  <td>51.25</td>
                  <td>53.37</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Llama 3.1 (8B)</td>
                  <td>53.26</td>
                  <td>73.00</td>
                  <td>57.38</td>
                  <td>62.49</td>
                  <td>79.11</td>
                  <td>65.91<sup>b</sup></td>
                  <td>63.07</td>
                  <td>74.00</td>
                  <td>64.66</td>
                  <td>63.47</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>GPT-4o</td>
                  <td>64.15</td>
                  <td>60.25</td>
                  <td>60.77</td>
                  <td>79.61</td>
                  <td>74.72</td>
                  <td>74.81</td>
                  <td>84.21</td>
                  <td>71.62</td>
                  <td>75.33<sup>b</sup></td>
                  <td>71.41</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>LSE</td>
                  <td>86.09</td>
                  <td>85.02</td>
                  <td>84.60</td>
                  <td>87.85</td>
                  <td>88.54</td>
                  <td>86.89</td>
                  <td>92.09</td>
                  <td>90.76</td>
                  <td>90.33<sup>b</sup></td>
                  <td>87.17<sup>d</sup></td>
                </tr>
                <tr valign="top">
                  <td colspan="12">
                    <bold>Similarity threshold of 0.6</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ACM</td>
                  <td>48.63</td>
                  <td>68.61</td>
                  <td>53.45<sup>b</sup></td>
                  <td>33.47</td>
                  <td>76.29</td>
                  <td>43.85</td>
                  <td>28.85</td>
                  <td>81.14</td>
                  <td>40.30</td>
                  <td>45.37</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>GHNLP</td>
                  <td>47.82</td>
                  <td>49.54</td>
                  <td>46.64<sup>b</sup></td>
                  <td>35.52</td>
                  <td>46.78</td>
                  <td>37.31</td>
                  <td>35.24</td>
                  <td>53.00</td>
                  <td>40.02</td>
                  <td>40.32</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Llama 3.1 (8B)</td>
                  <td>48.20</td>
                  <td>63.42</td>
                  <td>51.60</td>
                  <td>56.47</td>
                  <td>71.48</td>
                  <td>59.64<sup>b</sup></td>
                  <td>55.86</td>
                  <td>64.96</td>
                  <td>57.27</td>
                  <td>57.04</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>GPT-4o</td>
                  <td>59.05</td>
                  <td>55.63</td>
                  <td>56.02</td>
                  <td>72.11</td>
                  <td>68.86</td>
                  <td>68.57</td>
                  <td>77.97</td>
                  <td>66.86</td>
                  <td>70.14<sup>b</sup></td>
                  <td>65.80</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>LSE</td>
                  <td>84.89</td>
                  <td>83.82</td>
                  <td>83.40</td>
                  <td>86.64</td>
                  <td>87.42</td>
                  <td>85.78</td>
                  <td>91.20</td>
                  <td>89.57</td>
                  <td>89.42<sup>b</sup></td>
                  <td>86.10<sup>d</sup></td>
                </tr>
                <tr valign="top">
                  <td colspan="12">
                    <bold>Similarity threshold of 0.8</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ACM</td>
                  <td>37.66</td>
                  <td>51.10</td>
                  <td>41.13<sup>b</sup></td>
                  <td>20.68</td>
                  <td>46.07</td>
                  <td>26.87</td>
                  <td>18.58</td>
                  <td>52.81</td>
                  <td>26.63</td>
                  <td>30.38</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>GHNLP</td>
                  <td>37.85</td>
                  <td>40.01</td>
                  <td>37.62<sup>b</sup></td>
                  <td>24.45</td>
                  <td>33.15</td>
                  <td>26.18</td>
                  <td>25.83</td>
                  <td>39.23</td>
                  <td>29.54</td>
                  <td>29.88</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Llama 3.1 (8B)</td>
                  <td>41.12</td>
                  <td>52.23</td>
                  <td>43.60<sup>b</sup></td>
                  <td>40.81</td>
                  <td>51.59</td>
                  <td>43.13</td>
                  <td>40.39</td>
                  <td>45.41</td>
                  <td>40.96</td>
                  <td>42.71</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>GPT-4o</td>
                  <td>49.76</td>
                  <td>47.88</td>
                  <td>43.60</td>
                  <td>55.17</td>
                  <td>52.12</td>
                  <td>52.21</td>
                  <td>60.49</td>
                  <td>51.07</td>
                  <td>54.18<sup>b</sup></td>
                  <td>51.60</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>LSE</td>
                  <td>80.00</td>
                  <td>79.33</td>
                  <td>78.81</td>
                  <td>83.04</td>
                  <td>83.29</td>
                  <td>82.02</td>
                  <td>86.78</td>
                  <td>85.33</td>
                  <td>85.12<sup>b</sup></td>
                  <td>81.99<sup>d</sup></td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table3fn1">
                <p><sup>a</sup>ACM: Amazon Comprehend Medical.</p>
              </fn>
              <fn id="table3fn2">
                <p><sup>b</sup>For these values, the highest value obtained by a model among the 3-length range.</p>
              </fn>
              <fn id="table3fn3">
                <p><sup>c</sup>GHNLP: Google Healthcare Natural Language Application Programming Interface.</p>
              </fn>
              <fn id="table3fn4">
                <p><sup>d</sup>For these values, the LSE obtained the highest <italic>F</italic><sub>1</sub>-scores among all models in all the threshold-settings.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Off-the-Shelf Models Tend to Overpredict</title>
          <p>The GHNLP and ACM models largely extracted generic symptoms that were not disease specific, such as <italic>pregnancy</italic>, <italic>cold</italic>, <italic>sick</italic>, <italic>illness</italic>, and <italic>discomfort</italic>. In addition, they extracted mental conditions such as <italic>anxiety</italic>, <italic>overwhelmed</italic>, and <italic>feeling bad</italic> as PCOS symptoms. As a result, they identified more symptoms (4.84 and 9.05 per post by GHNLP and ACM on average, respectively) compared to the ground truth (mean 2.76, SD 1.90 per post). Moreover, they struggled to comprehend the context of the post content, often extracting medical jargon such as <italic>side effect</italic>, <italic>lab report</italic>, and <italic>medication</italic> as symptoms. Substantially, GHNLP and ACM extracted 64% (2874/4463) and 70% (5691/8161) incorrect symptoms, respectively, of the total symptoms identified (<xref rid="figure4" ref-type="fig">Figure 4</xref>). Longer posts aggravated these issues as the presence of more jargon further reduced the precision and <italic>F</italic><sub>1</sub>-scores of these models (<xref ref-type="table" rid="table3">Table 3</xref>). However, both models achieved better recall than precision due to overprediction.</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Performance comparison of different models in identifying symptom occurrences from 1000 sample posts. Each bar represents the number of correctly identified, not identified, and incorrectly identified symptoms stacked on top of each other. ACM: Amazon Comprehend Medical; GHNLP: Google Healthcare Natural Language Application Programming Interface; LSE: lexicon-based symptom extraction.</p>
            </caption>
            <graphic xlink:href="medinform_v13i1e70940_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Baselines Struggle to Capture Nuanced Symptoms</title>
          <p>All the baselines struggled to detect subtle symptoms, specifically when they were stated in informal language. As a result, GHNLP correctly identified only 50% (1589/3124) of the ground truth symptoms, whereas the LLMs showed better performance with approximately 65% (4133/6248) correct matches (<xref rid="figure4" ref-type="fig">Figure 4</xref>). Although ACM achieved a 79% (2470/3124) match with the ground truth, its overall performance was hindered by significant overpredictions. For instance, a PCOS symptom, <italic>high testosterone</italic>, was mentioned informally in the following post, but only LSE and none of the baselines could identify it:</p>
          <disp-quote>
            <p>I had two sets of blood tests taken last year, which showed that my hormones (especially testosterone) were all over the place. My GP said that my test results were enough to confirm PCOS diagnosis.</p>
          </disp-quote>
        </sec>
        <sec>
          <title>LSE Outperformed State-of-the-Art LLMs</title>
          <p><xref rid="figure4" ref-type="fig">Figure 4</xref> shows that, while LLMs significantly reduced the number of incorrectly identified symptoms, they still missed a notable number of symptoms. Leveraging the symptom list generated by LSE in the base prompt for generative pretrained transformers increased the number of correctly identified symptoms, enhancing overall performance. The high values for LSE across all metrics in <xref ref-type="table" rid="table3">Table 3</xref> indicate that the comprehensive symptom list effectively covered all PCOS lived experience symptoms while filtering out generic ones.</p>
        </sec>
        <sec>
          <title>Statistical Significance</title>
          <p>We also compared the <italic>F</italic><sub>1</sub>-score of LSE with those of the baselines using the approximated randomization test [<xref ref-type="bibr" rid="ref28">28</xref>] with a similarity threshold of 0.6 to determine whether the results were statistically significant. As this test does not require specific distributional assumptions, it is particularly suitable for complex metrics such as the <italic>F</italic><sub>1</sub>-score [<xref ref-type="bibr" rid="ref64">64</xref>]. We conducted pairwise comparisons between symptoms extracted from a post via LSE and each of the baselines. The number of occurrences in the sample set of 1000 posts in which LSE significantly outperformed the baselines at 95% (<italic>P</italic>&#60;.05) and 90% (<italic>P</italic>&#60;.10) confidence levels. The observed results suggest that, in terms of the <italic>F</italic><sub>1</sub>-score, LSE significantly outperformed all the other baselines shown in Table S10 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Analysis of PCOS Symptomatology</title>
        <sec>
          <title>Overview</title>
          <p>Our study was motivated by the limitations of existing information extraction methods in identifying symptom expressions from colloquial patient narratives. We propose an LSE method incorporating LLMs into the pipeline to capture disease-specific symptoms from social media discourse. We focused on PCOS as a representative case given its highly variable and often underdocumented symptomatology. We evaluated LSE against multiple strong baselines across a manually annotated Reddit dataset, and it demonstrated substantial improvements in precision, recall, and <italic>F</italic><sub>1</sub>-score.</p>
          <p>We conducted an in-depth study of PCOS symptomatology to evaluate the characteristics, prevalence, and occurrence patterns of the symptoms, capturing implicit insights from patient-generated data. We also highlighted how capturing symptoms in patient-centric language can bridge gaps between patient experiences and clinical practice, potentially enhancing health care provider communication and guiding clinical decision-making.</p>
        </sec>
        <sec>
          <title>Potentially Emerging Symptoms</title>
          <p>We identified 28 distinct symptoms from our comprehensive symptom list prominently reported by patients yet currently underrepresented or insufficiently explored in established medical literature and not acknowledged by existing eHealth sources (highlighted in italics in <xref ref-type="table" rid="table2">Table 2</xref>). Although many of these symptoms currently lack robust clinical evidence linking them directly to PCOS, their frequent occurrence in patient-generated data suggests that patients often experience and associate these symptoms with PCOS. As illustrated in <xref rid="figure5" ref-type="fig">Figure 5</xref>, the number of unique users reporting some of these symptoms, such as hypothyroidism and brain fog, demonstrate a consistent upward reporting trend over time. Moreover, some recent studies have provided medical evidence supporting the connection between some of these symptoms and PCOS, such as brain fog, thyroid disorder, low libido, digestive issues, and cravings [<xref ref-type="bibr" rid="ref65">65</xref>-<xref ref-type="bibr" rid="ref69">69</xref>]. Therefore, we marked them as potentially emerging symptoms. However, while frequently reported by patients, it is important to recognize that these symptoms might not represent entirely novel manifestations of PCOS. Instead, they may reflect less common but known clinical symptoms, secondary manifestations of the primary disease, or symptoms associated with frequently co-occurring conditions. For example, hypothyroidism, reported by 5366 users, reflects a well-established thyroid-PCOS comorbidity [<xref ref-type="bibr" rid="ref66">66</xref>], underscoring potential shared pathophysiological mechanisms rather than indicating a novel PCOS symptom. In addition, nausea and cravings, although frequently reported by patients, advocate for a broader and patient-inclusive diagnostic perspective rather than confirming direct causality. These emerging findings reinforce the credibility of patient-reported underdocumented symptoms and underscore the necessity for rigorous clinical investigation to determine their prevalence, pathophysiological connections, and implications for diagnosis and treatment protocols.</p>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>Instances of potentially emerging symptoms mentioned by users in the primary dataset, showing notable upward trends over time.</p>
            </caption>
            <graphic xlink:href="medinform_v13i1e70940_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Capturing Symptoms in Patient-Centric Language</title>
          <p>LSE captured the lived experience symptoms as expressed by the patients. This approach makes the symptoms more accessible to laypersons compared to clinical terminology and jargon. Some symptoms with unorthodox clinical terms require complex medical tests to diagnose, whereas their effects are often evident in lived experiences, and hence, these symptoms are included in the symptom list. For instance, hyperandrogenism is a symptom that may not be familiar to all users and requires laboratory tests, whereas hirsutism, acne, or hair loss are visible outcomes of the condition that are easily recognized and commonly reported by users, as shown in <xref ref-type="table" rid="table2">Table 2</xref>.</p>
        </sec>
        <sec>
          <title>Identifying Co-Occurrence of Symptoms</title>
          <p>We constructed a symptom co-occurrence matrix in which multiple symptoms mentioned by an individual in a single post or comment were considered as co-occurring. <xref rid="figure6" ref-type="fig">Figure 6</xref> illustrates a segment of the matrix highlighting the most frequently mentioned symptom pairs with their number of co-occurrences. The eHealth forums further complemented these co-occurrences. Understanding these co-occurring symptoms raises awareness among the community and helps individuals better cope with their condition. In addition, such analysis can assist health care providers and patients in proactively diagnosing and managing symptoms such as hirsutism, oily skin, and acne, as observed in the following comment:</p>
          <disp-quote>
            <p>The best natural remedy I’ve tried is spearmint supplement. I’m a thin cysterbut have most of the other symptoms and it has been the only thing I’ve foundso far that helps with hirsutism, oily skin, acne.</p>
          </disp-quote>
          <fig id="figure6" position="float">
            <label>Figure 6</label>
            <caption>
              <p>A segment of the symptom co-occurrence matrix, where hirsutism and acne appear as one of the most frequently mentioned symptom pairs.</p>
            </caption>
            <graphic xlink:href="medinform_v13i1e70940_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Association With Chronic Diseases and Comorbidity</title>
          <p>We identified 8 chronic diseases from the list of PCOS symptoms that were distinct medical conditions in their own right. For example, chronic conditions such as hypothyroidism and endometriosis were mentioned by 5366 and 2303 unique users, respectively (<xref ref-type="table" rid="table2">Table 2</xref>). The association with chronic diseases and comorbidity increases the complexity of the disease and its management and significantly impacts social determinants of health, as shown in the following example:</p>
          <disp-quote>
            <p>I went to the ER...but they found cysts on my ovaries and mentioned PCOS with possibly Endometriosis. Now, I have no insurance and I’m struggling to find the care. My husband and I want to start a family, but I feel like our chances are slipping away because I can’t afford the help I need. Any advice on where to get financial or medical support would be greatly appreciated.</p>
          </disp-quote>
          <p>The financial strain from frequent physician visits and prolonged medications impacts patients’ overall health outcomes. This emphasizes the need for clinical and public health research to find ways to reduce the burden on patients, such as overprescription and cost. This may also involve policy reforms to ensure comprehensive coverage for chronic conditions associated with PCOS.</p>
        </sec>
        <sec>
          <title>Enhancing Patient–Health Care Provider Communication</title>
          <p>The comprehensive symptom list generated by our lexicon-based approach, encompassing both widely recognized and emerging patient-reported symptoms, provides clinicians with a deeper insight into how patients perceive and articulate their condition. For example, terms such as <italic>brain fog</italic>, <italic>pelvic pressure</italic>, and <italic>fatigue</italic> are not only clinically relevant but also capture the nuanced ways in which patients describe their daily experiences with PCOS. Studies also show that using patient-generated health-related terminology during visits deepens shared understanding and decision‑making [<xref ref-type="bibr" rid="ref70">70</xref>]. Therefore, clinicians can leverage this enriched vocabulary to enhance patient–health care provider communication, promoting empathy, validating patient experiences, and facilitating more targeted and personalized clinical interviews.</p>
        </sec>
        <sec>
          <title>Guide to Clinical Decision-Making</title>
          <p>The patient-derived symptom list (<xref ref-type="table" rid="table2">Table 2</xref>) can serve as a preliminary checklist during consultations to identify overlooked or underdiscussed symptoms that patients might hesitate to share spontaneously due to stigma or uncertainty. Documenting co-occurrence patterns further empowers clinicians to anticipate linked symptoms. A patient presenting with hirsutism, for instance, could be screened for insulin resistance or acne, enabling early intervention and holistic management. To scale these benefits, the symptom list can be integrated into electronic health record systems. This integration allows for auto-completion prompts that reflect patient language while supporting consistent clinical documentation. Such structured integration enhances clinical decision-making through automated reminders and promotes interoperability for population-level research. Acknowledging patient-reported symptoms does not undermine established clinical evidence; rather, it complements traditional clinical frameworks by incorporating patient perspectives into evidence-based medicine.</p>
        </sec>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Despite the promising results, this study has several limitations. First, our study focused on a single health condition and a single social media platform, which may introduce platform-specific biases and limit generalizability. Second, both the lexicon and the evaluation sample sizes are relatively small for broader conclusions. Third, our findings are exploratory and hypothesis generating and not yet clinically validated.</p>
        <p>We also acknowledge specific implementation limitations. Although the LSE pipeline is designed for modularity and adaptability, applying it to other complex health conditions may require empirical adjustments. Determining optimal clusters for symptom identification and establishing semantic mapping rules for symptom normalization would require condition-specific customization. In this study, we used silhouette scores and inertia analysis to determine the optimal cluster metrics, such as the number of clusters (<italic>k</italic>). However, we recognize the limitation of distance-based metrics due to the curse of dimensionality, which may not fully capture cluster shape or density nuances. Despite this, our bootstrap stability analysis demonstrated consistently high Adjusted Rand Index (ARI) values across various <italic>k</italic> settings, indicating that our symptom clusters were robust to moderate changes in the number of clusters and to the random removal of data points. The performance of this framework may vary depending on the extracted lexicon due to linguistic variability and the nature of symptom discourse. Future work should focus on validating this method across diverse conditions, platforms, and languages. In addition, we plan to conduct online surveys and focus groups involving both patients and practitioners to assess the clinical relevance of our findings.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This work focused on extracting and analyzing disease-specific symptoms from individuals’ lived experiences with an application to the PCOS use case. The uniqueness of our work lies in several key aspects. The extraction of a symptom-related lexicon ensures the capture of subtle mentions without overlooking informal expressions on social media. We generated disease-specific symptoms by integrating LLMs into the NLP pipeline rather than relying on traditional NLP methods, which often obtain generic symptoms. In addition, analyzing PCOS symptomatology across varied dimensions revealed unique findings, such as emerging new symptoms expressed in patient-centric language, symptom co-occurrence patterns, and associated comorbidities. The outcomes of this work may help eliminate uncertainties surrounding complex medical conditions and contribute to clinical research and public health policies in a community-informed way.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Supplementary tables, prompts, and results.</p>
        <media xlink:href="medinform_v13i1e70940_app1.doc" xlink:title="DOC File , 797 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ACM</term>
          <def>
            <p>Amazon Comprehend Medical</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">BERT</term>
          <def>
            <p>bidirectional encoder representations from transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">DBCV</term>
          <def>
            <p>density-based clustering validation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">GHNLP</term>
          <def>
            <p>Google Healthcare Natural Language Application Programming Interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">HDBSCAN</term>
          <def>
            <p>hierarchical density-based spatial clustering of applications with noise</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">JI</term>
          <def>
            <p>Jaccard index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">LSE</term>
          <def>
            <p>lexicon-based symptom extraction</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">PCOS</term>
          <def>
            <p>polycystic ovary syndrome</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was partially supported by the Information and Communication Technology Division of Bangladesh under a postgraduate research fellowship grant. The funding body had no involvement in the study design; data collection, analysis, or experimentation; writing of the report; or decision to submit the paper for publication.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>We have publicly released our curated Reddit dataset and human-annotated labeled dataset. To support reproducibility, all source code and resources used in this study have also been made available. The datasets and related materials can be accessed through our GitHub repository [<xref ref-type="bibr" rid="ref71">71</xref>].</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>BH conceptualized the study, curated the data, designed the methodology, and organized this study; analyzed the results; and wrote, reviewed, and revised the manuscript. SMP and MEA contributed to conceptualization; supervision; validation of the results; and writing, review, and revision of the manuscript. MFR analyzed the results and contributed to writing, reviewing, and revising the manuscript. RA conceptualized the study, validated the results, and reviewed and revised the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kemp</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Digital 2023: global overview report</article-title>
          <source>DataReportal</source>
          <year>2023</year>
          <month>01</month>
          <day>26</day>
          <access-date>2025-05-25</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://datareportal.com/reports/digital-2023-global-overview-report">https://datareportal.com/reports/digital-2023-global-overview-report</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <article-title>National health interview survey</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <access-date>2025-05-25</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/nchs/nhis/2022nhis.htm">https://www.cdc.gov/nchs/nhis/2022nhis.htm</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jelodar</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Orji</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Deep sentiment classification and topic discovery on novel coronavirus or COVID-19 online discussions: NLP using LSTM recurrent neural network approach</article-title>
          <source>IEEE J Biomed Health Inform</source>
          <year>2020</year>
          <month>10</month>
          <volume>24</volume>
          <issue>10</issue>
          <fpage>2733</fpage>
          <lpage>42</lpage>
          <pub-id pub-id-type="doi">10.1109/JBHI.2020.3001216</pub-id>
          <pub-id pub-id-type="medline">32750931</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chopra</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zehrung</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shanmugam</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Choe</surname>
              <given-names>EK</given-names>
            </name>
          </person-group>
          <article-title>Living with uncertainty and stigma: self-experimentation and support-seeking around polycystic ovary syndrome</article-title>
          <source>Proceedings of the 2021 CHI Conference on Human Factors in Computing Systems</source>
          <year>2021</year>
          <conf-name>CHI '21</conf-name>
          <conf-date>May 8-13, 2021</conf-date>
          <conf-loc>Yokohama, Japan</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3411764.3445706</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>LL</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Lohmann</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Negraia</surname>
              <given-names>DV</given-names>
            </name>
          </person-group>
          <article-title>What are you anxious about? examining subjects of anxiety during the COVID-19 pandemic</article-title>
          <source>Proceedings of the Int AAAI Conf Web Soc Media</source>
          <year>2023</year>
          <month>06</month>
          <day>02</day>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>137</fpage>
          <lpage>48</lpage>
          <pub-id pub-id-type="doi">10.1609/icwsm.v17i1.22133</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Attai</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Cowher</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Hamadani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schoger</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Staley</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Landercasper</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Twitter social media is an effective tool for breast cancer patient education and support: patient-reported outcomes by survey</article-title>
          <source>J Med Internet Res</source>
          <year>2015</year>
          <month>07</month>
          <day>30</day>
          <volume>17</volume>
          <issue>7</issue>
          <fpage>e188</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2015/7/e188/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.4721</pub-id>
          <pub-id pub-id-type="medline">26228234</pub-id>
          <pub-id pub-id-type="pii">v17i7e188</pub-id>
          <pub-id pub-id-type="pmcid">PMC4705354</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jeon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Baruah</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Sarabadani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Palanica</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Identification of risk factors and symptoms of COVID-19: analysis of biomedical literature and social media data</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>10</month>
          <day>02</day>
          <volume>22</volume>
          <issue>10</issue>
          <fpage>e20509</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/10/e20509/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/20509</pub-id>
          <pub-id pub-id-type="medline">32936770</pub-id>
          <pub-id pub-id-type="pii">v22i10e20509</pub-id>
          <pub-id pub-id-type="pmcid">PMC7537723</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sendra</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Farré</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Vaagan</surname>
              <given-names>RW</given-names>
            </name>
          </person-group>
          <article-title>Seeking, sharing and co-creating: a systematic review of the relation between social support theory, social media use and chronic diseases</article-title>
          <source>Soc Theory Health</source>
          <year>2019</year>
          <month>05</month>
          <day>27</day>
          <volume>18</volume>
          <fpage>317</fpage>
          <lpage>39</lpage>
          <pub-id pub-id-type="doi">10.1057/s41285-019-00106-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McKillop</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mamykina</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Designing in the dark: eliciting self-tracking dimensions for understanding enigmatic disease</article-title>
          <source>Proceedings of the 2018 CHI Conference on Human Factors in Computing Systems</source>
          <year>2018</year>
          <conf-name>CHI '18</conf-name>
          <conf-date>April 21-26, 2018</conf-date>
          <conf-loc>Montreal, QC</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3173574.3174139</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lentscher</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Decherney</surname>
              <given-names>AH</given-names>
            </name>
          </person-group>
          <article-title>Clinical presentation and diagnosis of polycystic ovarian syndrome</article-title>
          <source>Clin Obstet Gynecol</source>
          <year>2021</year>
          <month>03</month>
          <day>01</day>
          <volume>64</volume>
          <issue>1</issue>
          <fpage>3</fpage>
          <lpage>11</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32701517"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/GRF.0000000000000563</pub-id>
          <pub-id pub-id-type="medline">32701517</pub-id>
          <pub-id pub-id-type="pii">00003081-202103000-00003</pub-id>
          <pub-id pub-id-type="pmcid">PMC10683967</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Porta</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Greenland</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hernán</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>dos Santos Silva</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Last</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <source>A Dictionary of Epidemiology</source>
          <year>2014</year>
          <publisher-loc>Oxford, UK</publisher-loc>
          <publisher-name>Oxford University Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Romano</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Sharif</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Basak</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gatto</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Preum</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Theme-driven keyphrase extraction to analyze social media discourse</article-title>
          <source>Proc Int AAAI Conf Web Soc Media</source>
          <year>2024</year>
          <month>05</month>
          <day>28</day>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>1315</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="doi">10.1609/icwsm.v18i1.31391</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ohno</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Aomori</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Nishiyama</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kato</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Fujiki</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ishikawa</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kiyomiya</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Isawa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mochizuki</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Aramaki</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ohtani</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Performance improvement of a natural language processing tool for extracting patient narratives related to medical states from Japanese pharmaceutical care records by increasing the amount of training data: natural language processing analysis and validation study</article-title>
          <source>JMIR Med Inform</source>
          <year>2025</year>
          <month>03</month>
          <day>04</day>
          <volume>13</volume>
          <fpage>e68863</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2025//e68863/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/68863</pub-id>
          <pub-id pub-id-type="medline">40053805</pub-id>
          <pub-id pub-id-type="pii">v13i1e68863</pub-id>
          <pub-id pub-id-type="pmcid">PMC11920660</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Molenaar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lukose</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jenkins</surname>
              <given-names>EL</given-names>
            </name>
            <name name-style="western">
              <surname>McCaffrey</surname>
              <given-names>TA</given-names>
            </name>
          </person-group>
          <article-title>Using natural language processing to explore social media opinions on food security: sentiment analysis and topic modeling study</article-title>
          <source>J Med Internet Res</source>
          <year>2024</year>
          <month>03</month>
          <day>21</day>
          <volume>26</volume>
          <fpage>e47826</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2024//e47826/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/47826</pub-id>
          <pub-id pub-id-type="medline">38512326</pub-id>
          <pub-id pub-id-type="pii">v26i1e47826</pub-id>
          <pub-id pub-id-type="pmcid">PMC10995791</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Schoene</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ananiadou</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing applied to mental illness detection: a narrative review</article-title>
          <source>NPJ Digit Med</source>
          <year>2022</year>
          <month>04</month>
          <day>08</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>46</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-022-00589-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-022-00589-7</pub-id>
          <pub-id pub-id-type="medline">35396451</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-022-00589-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC8993841</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sharif</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Gatto</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Basak</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Preum</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Explicit, implicit, and scattered: revisiting event extraction to capture complex arguments</article-title>
          <source>Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing</source>
          <year>2024</year>
          <conf-name>EMNLP 2024</conf-name>
          <conf-date>November 12-16, 2024</conf-date>
          <conf-loc>Miami, FL</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/2024.emnlp-main.673</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ovadje</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Garadi</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Sarker</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Evaluating large language models for health-related text classification tasks with public social media data</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2024</year>
          <month>10</month>
          <day>01</day>
          <volume>31</volume>
          <issue>10</issue>
          <fpage>2181</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocae210</pub-id>
          <pub-id pub-id-type="medline">39121174</pub-id>
          <pub-id pub-id-type="pii">7731085</pub-id>
          <pub-id pub-id-type="pmcid">PMC11413434</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Searle</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ratas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shek</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Teo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dobson</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Improving extraction of clinical event contextual properties from electronic health records: a comparative study</article-title>
          <source>ArXiv</source>
          <comment>Preprint posted online on August 30, 2024</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2408.17181</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mulvenna</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Bond</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Clinical entity extraction: comparison between MetaMap, cTAKES, CLAMP and Amazon comprehend medical</article-title>
          <source>Proceedings of the 32nd Irish Signals and Systems Conference</source>
          <year>2021</year>
          <conf-name>ISSC 2021</conf-name>
          <conf-date>June 10-11, 2021</conf-date>
          <conf-loc>Athlone, Ireland</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1109/ISSC52156.2021.9467856"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/issc52156.2021.9467856</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Havrilla</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Guthrie</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Schultz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing (NLP) tools in extracting biomedical concepts from research articles: a case study on autism spectrum disorder</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2020</year>
          <month>12</month>
          <day>30</day>
          <volume>20</volume>
          <issue>Suppl 11</issue>
          <fpage>322</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-020-01352-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-020-01352-2</pub-id>
          <pub-id pub-id-type="medline">33380331</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-020-01352-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC7772897</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agrawal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hegselmann</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sontag</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Large language models are few-shot clinical information extractors</article-title>
          <source>ArXiv</source>
          <comment>Preprint posted online on May 25, 2022</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.2205.12689"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2205.12689</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sorbello</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haque</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Hasan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Jermyn</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hussein</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vega</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zembrzuski</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ripple</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ahadpour</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence-enabled software prototype to inform opioid pharmacovigilance from electronic health records: development and usability study</article-title>
          <source>JMIR AI</source>
          <year>2023</year>
          <volume>2</volume>
          <fpage>e45000</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ai.jmir.org/2023//e45000/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/45000</pub-id>
          <pub-id pub-id-type="medline">37771410</pub-id>
          <pub-id pub-id-type="pii">e45000</pub-id>
          <pub-id pub-id-type="pmcid">PMC10538589</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gandhi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Storey</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>A deep language model for symptom extraction from clinical text and its application to extract COVID-19 symptoms from social media</article-title>
          <source>IEEE J Biomed Health Inform</source>
          <year>2022</year>
          <month>04</month>
          <volume>26</volume>
          <issue>4</issue>
          <fpage>1737</fpage>
          <lpage>48</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34705659"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/JBHI.2021.3123192</pub-id>
          <pub-id pub-id-type="medline">34705659</pub-id>
          <pub-id pub-id-type="pmcid">PMC9074854</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dolatabadi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Moyano</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bales</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Spasojevic</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bhambhoria</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bhatti</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Debnath</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hoell</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Leng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Nanda</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Saab</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sahak</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Sie</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Uppal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Vadlamudi</surname>
              <given-names>NK</given-names>
            </name>
            <name name-style="western">
              <surname>Vladimirova</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yakimovich</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Kocak</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Cheung</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Using social media to help understand patient-reported health outcomes of post-COVID-19 condition: natural language processing approach</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>09</month>
          <day>19</day>
          <volume>25</volume>
          <fpage>e45767</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023//e45767/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/45767</pub-id>
          <pub-id pub-id-type="medline">37725432</pub-id>
          <pub-id pub-id-type="pii">v25i1e45767</pub-id>
          <pub-id pub-id-type="pmcid">PMC10510753</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Massey</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Grady</surname>
              <given-names>CB</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Matzner</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mahajan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Caraballo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Xue</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Dreyer</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Roy</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Krumholz</surname>
              <given-names>HM</given-names>
            </name>
          </person-group>
          <article-title>Tracking self-reported symptoms and medical conditions on social media during the COVID-19 pandemic: infodemiological study</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2021</year>
          <month>09</month>
          <day>28</day>
          <volume>7</volume>
          <issue>9</issue>
          <fpage>e29413</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2021/9/e29413/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/29413</pub-id>
          <pub-id pub-id-type="medline">34517338</pub-id>
          <pub-id pub-id-type="pii">v7i9e29413</pub-id>
          <pub-id pub-id-type="pmcid">PMC8480398</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Babaian</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Entity recognition from colloquial text</article-title>
          <source>Decis Support Syst</source>
          <year>2024</year>
          <month>04</month>
          <volume>179</volume>
          <fpage>114172</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.dss.2024.114172"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.dss.2024.114172</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Eworuke</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Khashei</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Identifying COVID-19 cases and extracting patient reported symptoms from Reddit using natural language processing</article-title>
          <source>Sci Rep</source>
          <year>2023</year>
          <month>08</month>
          <day>22</day>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>13721</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-023-39986-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-023-39986-7</pub-id>
          <pub-id pub-id-type="medline">37607963</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-023-39986-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC10444846</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gueta</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gilon</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Erell</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Jaber</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Reddy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kartha</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Steiner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Laish</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Feder</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>LLMs accelerate annotation for medical information extraction</article-title>
          <source>ArXiv</source>
          <comment>Preprint posted online on December 4, 2023</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2312.02296</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>WI</given-names>
            </name>
            <name name-style="western">
              <surname>Leung</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McNeil</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Kwok</surname>
              <given-names>KO</given-names>
            </name>
          </person-group>
          <article-title>Extracting symptoms from free-text responses using ChatGPT among COVID-19 cases in Hong Kong</article-title>
          <source>Clin Microbiol Infect</source>
          <year>2024</year>
          <month>01</month>
          <volume>30</volume>
          <issue>1</issue>
          <fpage>142.e1</fpage>
          <lpage>3</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1198-743X(23)00540-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cmi.2023.11.002</pub-id>
          <pub-id pub-id-type="medline">37949111</pub-id>
          <pub-id pub-id-type="pii">S1198-743X(23)00540-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Viswaroopan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zuo</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Improving entity recognition using ensembles of deep learning and fine-tuned large language models: a case study on adverse event extraction from VAERS and social media</article-title>
          <source>J Biomed Inform</source>
          <year>2025</year>
          <month>03</month>
          <volume>163</volume>
          <fpage>104789</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.jbi.2025.104789"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2025.104789</pub-id>
          <pub-id pub-id-type="medline">39923968</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(25)00018-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="web">
          <article-title>Polycystic ovary syndrome</article-title>
          <source>World Health Organization</source>
          <year>2025</year>
          <month>02</month>
          <day>07</day>
          <access-date>2025-05-25</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/news-room/fact-sheets/detail/polycystic-ovary-syndrome">https://www.who.int/news-room/fact-sheets/detail/polycystic-ovary-syndrome</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Escobar-Morreale</surname>
              <given-names>HF</given-names>
            </name>
          </person-group>
          <article-title>Polycystic ovary syndrome: definition, aetiology, diagnosis and treatment</article-title>
          <source>Nat Rev Endocrinol</source>
          <year>2018</year>
          <month>05</month>
          <volume>14</volume>
          <issue>5</issue>
          <fpage>270</fpage>
          <lpage>84</lpage>
          <pub-id pub-id-type="doi">10.1038/nrendo.2018.24</pub-id>
          <pub-id pub-id-type="medline">29569621</pub-id>
          <pub-id pub-id-type="pii">nrendo.2018.24</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rowlands</surname>
              <given-names>IJ</given-names>
            </name>
            <name name-style="western">
              <surname>Teede</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lucke</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dobson</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>GD</given-names>
            </name>
          </person-group>
          <article-title>Young women's psychological distress after a diagnosis of polycystic ovary syndrome or endometriosis</article-title>
          <source>Hum Reprod</source>
          <year>2016</year>
          <month>09</month>
          <day>13</day>
          <volume>31</volume>
          <issue>9</issue>
          <fpage>2072</fpage>
          <lpage>81</lpage>
          <pub-id pub-id-type="doi">10.1093/humrep/dew174</pub-id>
          <pub-id pub-id-type="medline">27412249</pub-id>
          <pub-id pub-id-type="pii">dew174</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Malhotra</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kempegowda</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Appraising unmet needs and misinformation spread about polycystic ovary syndrome in 85,872 YouTube comments over 12 years: big data infodemiology study</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>09</month>
          <day>11</day>
          <volume>25</volume>
          <fpage>e49220</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023//e49220/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/49220</pub-id>
          <pub-id pub-id-type="medline">37695666</pub-id>
          <pub-id pub-id-type="pii">v25i1e49220</pub-id>
          <pub-id pub-id-type="pmcid">PMC10520765</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Naroji</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>John</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gomez-Lobo</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Understanding PCOS-related content across social media platforms-a cross-sectional analysis</article-title>
          <source>J Pediatr Adolesc Gynecol</source>
          <year>2024</year>
          <month>04</month>
          <volume>37</volume>
          <issue>2</issue>
          <fpage>142</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jpag.2023.10.007</pub-id>
          <pub-id pub-id-type="medline">37992985</pub-id>
          <pub-id pub-id-type="pii">S1083-3188(23)00439-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cruz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Qazi</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Vasireddy</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Vilchez-Russell</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Stuparich</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Nahas</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Behbehani</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Instagram cysters: what’s available on polycystic ovarian syndrome?</article-title>
          <source>Fertil Steril</source>
          <year>2022</year>
          <month>10</month>
          <volume>118</volume>
          <issue>4</issue>
          <fpage>e323</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.fertstert.org/article/S0015-0282(22)01521-7/fulltext"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Proferes</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Gilbert</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fiesler</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zimmer</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Studying Reddit: a systematic overview of disciplines, approaches, methods, and ethics</article-title>
          <source>Soc Media Soc</source>
          <year>2021</year>
          <month>05</month>
          <day>26</day>
          <volume>7</volume>
          <issue>2</issue>
          <pub-id pub-id-type="doi">10.1177/20563051211019004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boe</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>PRAW: the python Reddit API wrapper</article-title>
          <source>GitHub</source>
          <year>2020</year>
          <access-date>2025-08-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/praw-dev/praw/">https://github.com/praw-dev/praw/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baumgartner</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <source>Pushshift Reddit API Documentation</source>
          <year>2018</year>
          <access-date>2025-08-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://reddit-api.readthedocs.io/">https://reddit-api.readthedocs.io/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Timsina</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Raut</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Freeman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Levin</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Nadkarni</surname>
              <given-names>GN</given-names>
            </name>
            <name name-style="western">
              <surname>Glicksberg</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Klang</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Exploring temperature effects on large language models across various clinical tasks</article-title>
          <source>medRxiv</source>
          <comment>Preprint posted online on July 22, 2024</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.medrxiv.org/content/10.1101/2024.07.22.24310824v1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1101/2024.07.22.24310824</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Keloth</surname>
              <given-names>VK</given-names>
            </name>
            <name name-style="western">
              <surname>Zuo</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Improving large language models for clinical named entity recognition via prompt engineering</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2024</year>
          <month>09</month>
          <day>01</day>
          <volume>31</volume>
          <issue>9</issue>
          <fpage>1812</fpage>
          <lpage>20</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocad259</pub-id>
          <pub-id pub-id-type="medline">38281112</pub-id>
          <pub-id pub-id-type="pii">7590607</pub-id>
          <pub-id pub-id-type="pmcid">PMC11339492</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ouyang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Almeida</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wainwright</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Mishkin</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Slama</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ray</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schulman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hilton</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kelton</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Simens</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Askell</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Welinder</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Christiano</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Leike</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lowe</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Training language models to follow instructions with human feedback</article-title>
          <source>Proceedings of the 36th International Conference on Neural Information Processing Systems</source>
          <year>2022</year>
          <conf-name>NIPS'22</conf-name>
          <conf-date>November 28-December 9, 2022</conf-date>
          <conf-loc>New Orleans, LA</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.5555/3600270.3602281"/>
          </comment>
          <pub-id pub-id-type="doi">10.5860/choice.189890</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Leas</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Ayers</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Desai</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hogarth</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>Using large language models to support content analysis: a case study of ChatGPT for adverse event detection</article-title>
          <source>J Med Internet Res</source>
          <year>2024</year>
          <month>05</month>
          <day>02</day>
          <volume>26</volume>
          <fpage>e52499</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2024//e52499/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/52499</pub-id>
          <pub-id pub-id-type="medline">38696245</pub-id>
          <pub-id pub-id-type="pii">v26i1e52499</pub-id>
          <pub-id pub-id-type="pmcid">PMC11099800</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>HY</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>SY</given-names>
            </name>
          </person-group>
          <article-title>Predicting user engagement in health misinformation correction on social media platforms in Taiwan: content analysis and text mining study</article-title>
          <source>J Med Internet Res</source>
          <year>2025</year>
          <month>01</month>
          <day>23</day>
          <volume>27</volume>
          <fpage>e65631</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2025//e65631/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/65631</pub-id>
          <pub-id pub-id-type="medline">39847418</pub-id>
          <pub-id pub-id-type="pii">v27i1e65631</pub-id>
          <pub-id pub-id-type="pmcid">PMC11803327</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mohr</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Wuhrl</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Klinger</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>CoVERT: a corpus of fact-checked biomedical COVID-19 tweets</article-title>
          <source>Proceedings of the 13th Conference on Language Resources and Evaluation</source>
          <year>2022</year>
          <conf-name>LREC 2022</conf-name>
          <conf-date>June 20-25, 2022</conf-date>
          <conf-loc>Marseille, France</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/2022.lrec-1.26.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Herman Bernardim Andrade</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Nishiyama</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fujimaki</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yada</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wakamiya</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Takagi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kato</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Miyashiro</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Aramaki</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Assessing domain adaptation in adverse drug event extraction on real-world breast cancer records</article-title>
          <source>Int J Med Inform</source>
          <year>2024</year>
          <month>11</month>
          <volume>191</volume>
          <fpage>105539</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1386-5056(24)00202-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2024.105539</pub-id>
          <pub-id pub-id-type="medline">39084086</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(24)00202-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sarwar</surname>
              <given-names>TB</given-names>
            </name>
            <name name-style="western">
              <surname>Noor</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Saef Ullah Miah</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Evaluating keyphrase extraction algorithms for finding similar news articles using lexical similarity calculation and semantic relatedness measurement by word embedding</article-title>
          <source>PeerJ Comput Sci</source>
          <year>2022</year>
          <volume>8</volume>
          <fpage>e1024</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35875631"/>
          </comment>
          <pub-id pub-id-type="doi">10.7717/peerj-cs.1024</pub-id>
          <pub-id pub-id-type="medline">35875631</pub-id>
          <pub-id pub-id-type="pii">cs-1024</pub-id>
          <pub-id pub-id-type="pmcid">PMC9299267</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Bert: pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>ArXiv</source>
          <comment>Preprint posted online on October 11, 2018</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1810.04805"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/N19-1423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Iyyer</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Phrase-BERT: improved phrase embeddings from BERT with an application to corpus exploration</article-title>
          <source>ArXiv</source>
          <comment>Preprint posted online on September 13, 2021</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2109.06304"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/2021.emnlp-main.846</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yoon</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>So</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>BioBERT: a pre-trained biomedical language representation model for biomedical text mining</article-title>
          <source>Bioinformatics</source>
          <year>2020</year>
          <month>02</month>
          <day>15</day>
          <volume>36</volume>
          <issue>4</issue>
          <fpage>1234</fpage>
          <lpage>40</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31501885"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btz682</pub-id>
          <pub-id pub-id-type="medline">31501885</pub-id>
          <pub-id pub-id-type="pii">5566506</pub-id>
          <pub-id pub-id-type="pmcid">PMC7703786</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shahapure</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Nicholas</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Cluster quality analysis using silhouette score</article-title>
          <source>Proceedings of the IEEE 7th International Conference on Data Science and Advanced Analytics</source>
          <year>2020</year>
          <conf-name>DSAA 2020</conf-name>
          <conf-date>October 6-9, 2020</conf-date>
          <conf-loc>Sydney, Australia</conf-loc>
          <pub-id pub-id-type="doi">10.1109/dsaa49011.2020.00096</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moulavi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jaskowiak</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Campello</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zimek</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sander</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Density-based clustering validation</article-title>
          <source>Proceedings of the 2014 SIAM International Conference on Data Mining</source>
          <year>2014</year>
          <conf-name>SIAM 2014</conf-name>
          <conf-date>April 24-26, 2014</conf-date>
          <conf-loc>Philadelphia, PA</conf-loc>
          <pub-id pub-id-type="doi">10.1137/1.9781611973440.96</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhuang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kaplan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Spherical text embedding</article-title>
          <source>Proceedings of the 33rd International Conference on Neural Information Processing Systems</source>
          <year>2019</year>
          <conf-name>NIPS'19</conf-name>
          <conf-date>December 8-14, 2019</conf-date>
          <conf-loc>Vancouver, BC</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Risch</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Möller</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gutsch</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pietsch</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Semantic answer similarity for evaluating question answering models</article-title>
          <source>Proceedings of the 3rd Workshop on Machine Reading for Question Answering</source>
          <year>2021</year>
          <conf-name>MRQA 2021</conf-name>
          <conf-date>November 10, 2021</conf-date>
          <conf-loc>Online</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/2021.mrqa-1.15</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>ZS</given-names>
            </name>
            <name name-style="western">
              <surname>Jonnagaddala</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>OpenDeID pipeline for unstructured electronic health record text notes based on rules and transformers: deidentification algorithm development and validation study</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>12</month>
          <day>06</day>
          <volume>25</volume>
          <fpage>e48145</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023//e48145/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48145</pub-id>
          <pub-id pub-id-type="medline">38055317</pub-id>
          <pub-id pub-id-type="pii">v25i1e48145</pub-id>
          <pub-id pub-id-type="pmcid">PMC10733816</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="web">
          <article-title>Mayo clinic</article-title>
          <source>Mayo Foundation for Medical Education and Research</source>
          <access-date>2025-05-25</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mayoclinic.org/">https://www.mayoclinic.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="web">
          <article-title>A Visual Guide to PCOS</article-title>
          <source>WebMD</source>
          <year>2025</year>
          <month>06</month>
          <day>24</day>
          <access-date>2025-08-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.webmd.com/women/ss/slideshow-pcos-overview">https://www.webmd.com/women/ss/slideshow-pcos-overview</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="web">
          <article-title>Free ICD-10-CM data</article-title>
          <source>ICD10Data.com</source>
          <access-date>2025-05-25</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.icd10data.com/ICD10CM">https://www.icd10data.com/ICD10CM</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="web">
          <article-title>Polycystic ovary syndrome (PCOS)</article-title>
          <source>Johns Hopkins University</source>
          <access-date>2025-05-25</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.hopkinsmedicine.org/health/conditions-and-diseases/polycystic-ovary-syndrome-pcos">https://www.hopkinsmedicine.org/health/conditions-and-diseases/polycystic-ovary-syndrome-pcos</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="web">
          <article-title>Polycystic ovary syndrome</article-title>
          <source>National Health Service</source>
          <access-date>2025-05-25</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nhs.uk/conditions/polycystic-ovary-syndrome-pcos/">https://www.nhs.uk/conditions/polycystic-ovary-syndrome-pcos/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="web">
          <article-title>Diabetes and polycystic ovary syndrome (PCOS)</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <year>2024</year>
          <month>5</month>
          <day>15</day>
          <access-date>2025-05-25</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/diabetes/risk-factors/pcos-polycystic-ovary-syndrome.html">https://www.cdc.gov/diabetes/risk-factors/pcos-polycystic-ovary-syndrome.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="web">
          <article-title>Amazon comprehend medical</article-title>
          <source>Amazon Web Services</source>
          <access-date>2025-05-25</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aws.amazon.com/comprehend/medical/">https://aws.amazon.com/comprehend/medical/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="web">
          <article-title>Cloud healthcare API</article-title>
          <source>Google Cloud</source>
          <access-date>2025-05-25</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cloud.google.com/healthcare-api?hl=en">https://cloud.google.com/healthcare-api?hl=en</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yeh</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>More accurate tests for the statistical significance of result differences</article-title>
          <source>Proceedings of the COLING 2000 Volume 2: The 18th International Conference on Computational Linguistics</source>
          <year>2000</year>
          <conf-name>COLING 2000</conf-name>
          <conf-date>July 31-August 4, 2000</conf-date>
          <conf-loc>Saarbrücken, Germany</conf-loc>
          <pub-id pub-id-type="doi">10.3115/992730.992783</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huddleston</surname>
              <given-names>HG</given-names>
            </name>
            <name name-style="western">
              <surname>Jaswa</surname>
              <given-names>EG</given-names>
            </name>
            <name name-style="western">
              <surname>Casaletto</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>Neuhaus</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wellons</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Launer</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Yaffe</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Associations of polycystic ovary syndrome with indicators of brain health at midlife in the CARDIA cohort</article-title>
          <source>Neurology</source>
          <year>2024</year>
          <month>02</month>
          <day>27</day>
          <volume>102</volume>
          <issue>4</issue>
          <pub-id pub-id-type="doi">10.1212/wnl.0000000000208104</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Singla</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Khemani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Aggarwal</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Thyroid disorders and polycystic ovary syndrome: an emerging relationship</article-title>
          <source>Indian J Endocrinol Metab</source>
          <year>2015</year>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>25</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.ijem.in/article.asp?issn=2230-8210;year=2015;volume=19;issue=1;spage=25;epage=29;aulast=Singla"/>
          </comment>
          <pub-id pub-id-type="doi">10.4103/2230-8210.146860</pub-id>
          <pub-id pub-id-type="medline">25593822</pub-id>
          <pub-id pub-id-type="pii">IJEM-19-25</pub-id>
          <pub-id pub-id-type="pmcid">PMC4287775</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eftekhar</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sohrabvand</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Zabandan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Shariat</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Haghollahi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ghahghaei-Nezamabadi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Sexual dysfunction in patients with polycystic ovary syndrome and its affected domains</article-title>
          <source>Iran J Reprod Med</source>
          <year>2014</year>
          <month>08</month>
          <volume>12</volume>
          <issue>8</issue>
          <fpage>539</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/25408703"/>
          </comment>
          <pub-id pub-id-type="medline">25408703</pub-id>
          <pub-id pub-id-type="pmcid">PMC4233312</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kałużna</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kompf</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wachowiak-Ochmańska</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Moczko</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Królczyk</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Janicki</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Szapel</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Grzymisławski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ruchała</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ziemnicka</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Are patients with polycystic ovary syndrome more prone to irritable bowel syndrome?</article-title>
          <source>Endocr Connect</source>
          <year>2022</year>
          <volume>11</volume>
          <issue>4</issue>
          <fpage>e210309</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ec.bioscientifica.com/view/journals/ec/11/4/EC-21-0309.xml"/>
          </comment>
          <pub-id pub-id-type="doi">10.1530/ec-21-0309</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jeanes</surname>
              <given-names>YM</given-names>
            </name>
            <name name-style="western">
              <surname>Reeves</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gibson</surname>
              <given-names>EL</given-names>
            </name>
            <name name-style="western">
              <surname>Piggott</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>May</surname>
              <given-names>VA</given-names>
            </name>
            <name name-style="western">
              <surname>Hart</surname>
              <given-names>KH</given-names>
            </name>
          </person-group>
          <article-title>Binge eating behaviours and food cravings in women with polycystic ovary syndrome</article-title>
          <source>Appetite</source>
          <year>2017</year>
          <month>02</month>
          <day>01</day>
          <volume>109</volume>
          <fpage>24</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.1016/j.appet.2016.11.010</pub-id>
          <pub-id pub-id-type="medline">27825940</pub-id>
          <pub-id pub-id-type="pii">S0195-6663(16)30705-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Staehelin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Dolata</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stöckli</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Schwabe</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>How patient-generated data enhance patient-provider communication in chronic care: field study in design science research</article-title>
          <source>JMIR Med Inform</source>
          <year>2024</year>
          <month>09</month>
          <day>10</day>
          <volume>12</volume>
          <fpage>e57406</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2024//e57406/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/57406</pub-id>
          <pub-id pub-id-type="medline">39255481</pub-id>
          <pub-id pub-id-type="pii">v12i1e57406</pub-id>
          <pub-id pub-id-type="pmcid">PMC11422739</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="web">
          <article-title>Subreddit to symptomatology data and code</article-title>
          <source>GitHib</source>
          <access-date>2025-08-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/bush1987/LSE-Symptomatology">https://github.com/bush1987/LSE-Symptomatology</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
