<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v14i1e89534</article-id>
      <article-id pub-id-type="pmid">42155986</article-id>
      <article-id pub-id-type="doi">10.2196/89534</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Extracting Social Determinants of Health From Electronic Health Records: Development and Comparison of Rule-Based and Large Language Model Methods</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Coristine</surname>
            <given-names>Andrew</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Peterson</surname>
            <given-names>Thomas</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>García-Barragán</surname>
            <given-names>Álvaro</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Bo</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3412-3768</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Kabir</surname>
            <given-names>Dia</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0006-6740-7464</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Clark</surname>
            <given-names>Cheryl Renee</given-names>
          </name>
          <degrees>MD, SCD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6782-6382</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Choi</surname>
            <given-names>Karmel W</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3914-2431</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Smoller</surname>
            <given-names>Jordan W</given-names>
          </name>
          <degrees>MD, SCD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Center for Precision Psychiatry</institution>
            <institution>Massachusetts General Hospital</institution>
            <addr-line>Richard B. Simches Research Building</addr-line>
            <addr-line>185 Cambridge Street, 2nd Floor</addr-line>
            <addr-line>Boston, MA, 02114</addr-line>
            <country>United States</country>
            <phone>1 6177249447</phone>
            <email>jsmoller@mgb.org</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0381-6334</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Center for Precision Psychiatry</institution>
        <institution>Massachusetts General Hospital</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Psychiatric and Neurodevelopmental Genetics Unit</institution>
        <institution>Massachusetts General Hospital</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Psychiatry</institution>
        <institution>Harvard Medical School</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Broad Institute</institution>
        <addr-line>Cambridge, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Medicine</institution>
        <institution>Brigham and Women's Hospital</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Jordan W Smoller <email>jsmoller@mgb.org</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2026</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>19</day>
        <month>5</month>
        <year>2026</year>
      </pub-date>
      <volume>14</volume>
      <elocation-id>e89534</elocation-id>
      <history>
        <date date-type="received">
          <day>15</day>
          <month>12</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>8</day>
          <month>1</month>
          <year>2026</year>
        </date>
        <date date-type="accepted">
          <day>14</day>
          <month>4</month>
          <year>2026</year>
        </date>
      </history>
      <copyright-statement>©Bo Wang, Dia Kabir, Cheryl Renee Clark, Karmel W Choi, Jordan W Smoller. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 19.05.2026.</copyright-statement>
      <copyright-year>2026</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2026/1/e89534" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Social determinants of health (SDoH) are critical drivers of health outcomes but are often underdocumented in structured electronic health record (EHR) data. Instead, SDoH are more commonly recorded in unstructured clinical notes, and unlocking this information could have far-reaching implications for advancing population health research and informing clinical decision-making.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study develops and systematically evaluates cost-efficient methods for extracting SDoH information from unstructured clinical text using rule-based natural language processing (NLP) and large language model (LLM)–based approaches.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We constructed a gold-standard annotated corpus comprising clinical text segments from 171 patients in the Mass General Brigham Research Patient Data Registry, covering 7 SDoH domain categories and 23 subcategories. A rule-based system (RBS) was developed and evaluated alongside 7 OpenAI GPT models (GPT-4o, 4.1, 4.1-mini, o4-mini, GPT-5, GPT-5-mini, and o3) under zero-shot and few-shot settings using multiple prompting strategies. We additionally implemented late-fusion ensemble approaches that combined outputs from rule- and LLM-based methods. Performance was assessed using precision, recall, and <italic>F</italic><sub>1</sub>-score, alongside qualitative error analysis.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The RBS achieved high precision for SDoH domain categories (0.96) but substantially lower recall (0.68). GPT-based models consistently outperformed the RBS in overall recall and <italic>F</italic><sub>1</sub>-scores. The best domain-level performance was observed for GPT-5 and GPT-5-mini in few-shot settings (<italic>F</italic><sub>1</sub>-score=0.89), while o4-mini achieved the highest subcategory-level performance (<italic>F</italic><sub>1</sub>-score=0.88). A late-fusion ensemble integrating RBS and GPT outputs further improved domain-level performance (<italic>F</italic><sub>1</sub>-score=0.92), with balanced precision (0.93) and recall (0.90), but did not improve subcategory-level performance.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Recent GPT models with advanced reasoning capabilities, including the newly released mini models (eg, o4-mini and GPT-5-mini), demonstrated strong performance for SDoH extraction without task-specific fine-tuning and consistently outperformed the rule-based NLP system. Integrating rule- and LLM-based methods via late fusion further enhanced domain-level extraction performance. Our results demonstrate a cost-efficient framework for the accurate identification of SDoH from clinical text, facilitating downstream population health research and clinical informatics applications.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>social determinants of health</kwd>
        <kwd>electronic health records</kwd>
        <kwd>natural language processing</kwd>
        <kwd>large language model</kwd>
        <kwd>rule-based system</kwd>
        <kwd>information extraction</kwd>
        <kwd>social and behavioral determinants of health</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Social determinants of health (SDoH) are increasingly recognized as critical factors influencing health outcomes and contributing to health disparities. Unmet social needs, such as financial hardship, food insecurity, housing instability, and lack of social support, are estimated to account for 30%-55% of health outcomes [<xref ref-type="bibr" rid="ref1">1</xref>]. In recent years, electronic health records (EHRs) have been a crucial source of real-world data, with applications in risk stratification, pharmacoepidemiology, treatment response prediction, and more. However, the value of EHR-based research has been limited by the underdocumentation of important patient information, such as SDoH, within structured EHR data. Instead, this information is more commonly captured in unstructured clinical notes [<xref ref-type="bibr" rid="ref2">2</xref>-<xref ref-type="bibr" rid="ref4">4</xref>]. Unlocking the potential of this SDoH information could have far-reaching implications for population health research and inform clinical decision-making [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
      <p>Consequently, a growing body of work has focused on extracting SDoH from narrative clinical notes using natural language processing (NLP). Historically, these efforts have relied on either rule-based [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref8">8</xref>] or supervised machine learning approaches [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Although rule-based approaches are interpretable and customizable, they often suffer from low sensitivity because of their dependence on fixed, manually engineered rules. Conversely, supervised learning methods require significant amounts of high-quality annotated training data, which can be cost- and labor-intensive to generate. This dependence on annotated data is reflected in prior studies such as the 2022 n2c2/UW shared task [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>], in which the top-performing systems used transformer-based models fine-tuned on annotated corpora. Recent advances in large language models (LLMs) present an opportunity to develop scalable solutions for identifying SDoH without the need for substantial annotated data [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref15">15</xref>].</p>
      <p>Despite progress, several important gaps remain. First, the scope of SDoH domains addressed in most studies is limited. A 2021 review by Patra et al [<xref ref-type="bibr" rid="ref2">2</xref>] found that smoking status is among the most commonly studied SDoH-related domains, followed by substance abuse and homelessness. By contrast, SDoH factors such as financial problems, social support, food security, and health insurance coverage remain relatively underexplored [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. Second, rule-based approaches accounted for approximately one-quarter of the reviewed studies (22 out of 82) [<xref ref-type="bibr" rid="ref2">2</xref>]. Among studies exploring the use of LLMs, most have used either open-weight models such as LLaMA-2 (Large Language Model Meta AI 2) and FLAN-T5 (Fine-Tuned Language Net—Text-to-Text Transfer Transformer) [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref17">17</xref>] or earlier versions of proprietary LLMs like GPT-3.5 [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref14">14</xref>], while more advanced LLMs with superior reasoning capabilities, including in health care contexts [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>], remain largely unexplored for SDoH extraction. Notably, a recent study by Keloth et al [<xref ref-type="bibr" rid="ref15">15</xref>] emphasized the importance of evaluating the latest LLMs for this task. Lastly, while fine-tuning open-weight models has gained traction [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref17">17</xref>], the development and systematic evaluation of different prompting strategies with state-of-the-art LLMs, including fusion with rule-based systems (RBSs), remain understudied despite their relevance in resource-constrained settings.</p>
      <p>Our study addresses the aforementioned gaps by developing and evaluating methods to identify 7 SDoH domains from clinical text derived from multiple note types. In addition to commonly studied domains, we emphasize less-explored determinants such as social resources and health insurance status, as well as physical activity, a key behavioral determinant of health. A recent study by Lituiev et al [<xref ref-type="bibr" rid="ref20">20</xref>] used a 2-tier taxonomy with first- and second-level SDoH classes. Similarly, we developed a fine-grained classification system for each domain. For example, within health insurance status, we included subcategories such as adequate insurance coverage, lack of insurance, and government-assisted insurance to capture different levels of access to care and coverage. Inspired by the n2c2/UW shared task [<xref ref-type="bibr" rid="ref21">21</xref>], we further annotated each subcategory with 4 contextual attributes (temporality, experiencer, hypothetical status, and uncertainty). These attributes served as exclusion criteria for defining positive SDoH cases and supported qualitative analysis of the models’ handling of contextual distinctions. This annotation framework was designed to capture richer social context information for downstream applications such as health risk stratification.</p>
      <p>We present 2 complementary NLP approaches for SDoH extraction requiring minimal training and computational resources: an RBS and LLM-based method leveraging state-of-the-art OpenAI GPT models available at the time of experimentation. For the LLM-based approach, rule-based prescreening was used to identify candidate text segments from clinical notes, which were then classified by GPT models. We examined 7 GPT models in both zero-shot and few-shot settings without task-specific fine-tuning, evaluating performance at the segment level. Our prompting strategies incorporated examples that varied in annotation difficulty. This work extends prior studies by systematically evaluating advanced reasoning models and comparing their performance with that of the RBS. Finally, we investigated various ensemble strategies using late fusion to combine both approaches and further improve extraction performance. Overall, this study contributes to addressing key gaps in SDoH research and provides a cost-efficient framework for future clinical NLP applications.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethics Considerations</title>
        <p>This study was reviewed and approved by the Mass General Brigham (MGB) Institutional Review Board (protocol 2018P002642), with an informed consent waiver for the use of retrospective medical record data without patient interaction. The study procedures were conducted in accordance with the ethical standards of the relevant national and institutional committees on human experimentation and with the Declaration of Helsinki. Although the clinical notes used in this study were not deidentified, all data access, modeling, and analyses were restricted to authorized researchers and conducted within secure environments behind the MGB firewall. No identifiable patient information is included in the manuscript or its multimedia appendices. Participants did not receive compensation.</p>
      </sec>
      <sec>
        <title>Data Source</title>
        <p>Data were obtained from the MGB Research Patient Data Registry (RPDR) [<xref ref-type="bibr" rid="ref22">22</xref>], a centralized data registry of clinical information from EHRs across the MGB health system. The RPDR database includes approximately 7 million patients from 8 hospitals, including 2 major teaching hospitals, Massachusetts General Hospital and Brigham and Women’s Hospital, encompassing a wide range of patient characteristics, including structured data (demographics, diagnoses, medications, procedures, and laboratory tests) and unstructured narrative notes. We acquired all narrative clinical notes from 95,157 patients enrolled in the MGB Biobank [<xref ref-type="bibr" rid="ref23">23</xref>], with notes spanning March 1976 to November 2021. For this study, we used discharge summaries and progress notes, the latter including inpatient, outpatient, and emergency visit notes.</p>
      </sec>
      <sec>
        <title>SDoH Categories</title>
        <p>We established our SDoH classification schema (<xref rid="figure1" ref-type="fig">Figure 1</xref>) through iterative consultations with subject matter experts in psychology, psychiatry, and health disparities research. The final schema encompasses 7 domains, that is, 6 social and 1 behavioral (physical activity) determinants of health commonly screened in clinical practice [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]. To capture granular social contexts relevant to health outcomes, we further defined multiple subcategories within each domain category. Given the inherent overlap between certain subcategories (eg, “patient recently got laid off” could be characterized as both job loss and unemployment), we developed comprehensive annotation guidelines (see Appendix S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) to ensure consistency and reproducibility in data generation. The schema was also refined to draw more nuanced distinctions. For example, within social resources, we distinguished the subcategories of living with or accompanied by someone and living alone from good social resources and poor social resources to separate the living situation from the quality of social support. The initial taxonomy of 27 subcategories was refined to 23 based on data review and feasibility assessment. Instances falling within a domain category but not matching any specific subcategory were assigned to “N/A” (not applicable).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Social determinants of health classification schema comprising 7 domains: general financial status (green), employment status (beige), housing status (yellow), health insurance status (purple), food security status (orange), social resources (blue), and physical activity (teal). Domain names are shown in bold, with their corresponding subcategories listed beneath each domain (23 subcategories total).</p>
          </caption>
          <graphic xlink:href="medinform_v14i1e89534_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Gold-Standard Corpus Development</title>
        <p>An initial set of 2000 patients was sampled from the MGB Biobank cohort using stratified sampling based on several key sociodemographic variables: sex, self-reported race, age group (≥65 years vs &#60;65 years), and health insurance type (public vs private payer). This cohort was held out from system development, including lexicon refinement of the RBS, to ensure separation from evaluation. To create a gold-standard dataset, we conducted prescreening using predefined patterns from our RBS (see the next section), including keywords, rules, and regular expression-based matching, to identify sentences in patients’ notes likely containing SDoH information. Following prior work [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref27">27</xref>], for each potential SDoH mention, we extracted text segments with 150 characters of context on either side, providing sufficient information for annotation. We randomly sampled 79 unique text segments for annotator training and a separate set of 226 text segments (10 per subcategory, except “Other job insecurity and employment issues,” which had 6 instances) for primary model validation. These 226 segments were drawn from notes with a median documentation year of 2016 (IQR 2012-2019).</p>
        <p>We developed our annotation workflow using Label Studio [<xref ref-type="bibr" rid="ref28">28</xref>], an open-source data labeling platform (Figure S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Two annotators (BW, a postdoctoral researcher trained in biomedical informatics, and DK, a medical student with experience in neuropsychiatric research) underwent 3 training sessions and calibration meetings before final annotation. Disagreements between annotators were discussed and resolved in consensus meetings, with a clinical psychologist (KC) serving as the tiebreaker. Based on the finalized SDoH classification schema (<xref rid="figure1" ref-type="fig">Figure 1</xref>) and annotation guidelines, we defined 2 multilabel annotation tasks for each text segment:</p>
        <list list-type="bullet">
          <list-item>
            <p>Task 1: Identify mentions of the 7 SDoH domain categories.</p>
          </list-item>
          <list-item>
            <p>Task 2: Identify mentions of the 23 SDoH subcategories.</p>
          </list-item>
        </list>
        <p>Each training session began with a detailed discussion of the annotation guidelines and concluded with an interannotator agreement assessment. After completing 3 training sessions, annotators achieved acceptable interannotator agreement as measured by Krippendorff α [<xref ref-type="bibr" rid="ref29">29</xref>] (α=.88 for domain categories and α=.74 for subcategories). They then independently annotated the final 226 text segments, achieving α=.95 for domain categories, .84 for subcategories alone, and .78 for subcategories with contextual attributes (temporality, experiencer, hypothetical status, and uncertainty), all well above standard thresholds for reliability [<xref ref-type="bibr" rid="ref30">30</xref>].</p>
      </sec>
      <sec>
        <title>Rule-Based System</title>
        <sec>
          <title>Overview</title>
          <p>As illustrated in <xref rid="figure2" ref-type="fig">Figure 2</xref>, we developed an RBS to identify SDoH mentions in clinical notes. The system was implemented using medspaCy [<xref ref-type="bibr" rid="ref31">31</xref>], an open-source clinical NLP library that supports flexible integration of rule-based and machine learning–based algorithms. It uses a pipeline of NLP functions spanning sentence and section detection to concept extraction and contextual analysis to locate, match, and disambiguate SDoH mentions, along with an iterative process of manual testing, review, and refinement based on feedback to optimize model performance. Descriptions of each pipeline component are provided in Appendix S1.3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Rule-based system workflow: clinical notes (as the input) are processed through a text pipeline that includes sentence segmentation, lexicon-based entity matching, and context disambiguation, producing sentences labeled with social determinants of health (SDoH) domain categories and subcategories. The rules were developed through an iterative process involving manual review and refinement.</p>
            </caption>
            <graphic xlink:href="medinform_v14i1e89534_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Lexicon Creation and Expansion</title>
          <p>RBS requires a lexicon (a dictionary of relevant query terms) and corresponding rules for identifying matches in clinical text. We developed our SDoH lexicon through a multistep process: seed term curation, lexicon expansion, and iterative filtering and refinement (<xref rid="figure3" ref-type="fig">Figure 3</xref>). The initial lexicon comprised terms related to each domain derived from prior studies and reviews [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref36">36</xref>] and SDoH screening tools and surveys (see Appendix S1.1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). These seed terms were reviewed by a domain expert (CRC) and systematically expanded using (1) synonym identification and hierarchy mapping (hypernymy-hyponymy) through UMLS (Unified Medical Language System) Metathesaurus, and (2) semantic similarity search using text embedding models [<xref ref-type="bibr" rid="ref37">37</xref>-<xref ref-type="bibr" rid="ref42">42</xref>]. For instance, we encoded the MEDLINE N-Gram Set (1-5 grams) [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>] using an MPNet-based Sentence-BERT (Bidirectional Encoder Representations from Transformers) model (paraphrase-mpnet-base-v2) [<xref ref-type="bibr" rid="ref41">41</xref>] (which we make publicly available [<xref ref-type="bibr" rid="ref45">45</xref>]) and performed semantic searches using seed terms as queries against the embedded corpus to identify additional relevant SDoH terms. The iterative lexicon filtering step is detailed in Appendix S1.2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Lexicon curation process involving seed term selection, expansion using UMLS (Unified Medical Language System) and embedding-based semantic search, and iterative lexicon filtering. BERT: Bidirectional Encoder Representations from Transformers; BioSentVec: Biomedical Sentence Vector; BioVec: Biomedical Word Vector.</p>
            </caption>
            <graphic xlink:href="medinform_v14i1e89534_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
      <sec>
        <title>LLM-Based Models</title>
        <sec>
          <title>Model selection and configuration</title>
          <p>We used a series of OpenAI GPT models via the Azure OpenAI Service (Microsoft Foundry), deployed within MGB’s Health Insurance Portability and Accountability Act (HIPAA)–compliant Microsoft Azure infrastructure. Using the Chat Completions application programming interface (API), we prompted the models to identify SDoH categories and subcategories in clinical text segments, akin to a hierarchical multilabel classification task.</p>
          <p>While open-weight LLMs continue to improve, frontier proprietary models remain state-of-the-art on many benchmarks, particularly those involving reasoning tasks [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref47">47</xref>]. For this study, we selected 7 GPT models for SDoH extraction based on their performance on benchmarks, including HealthBench [<xref ref-type="bibr" rid="ref18">18</xref>], as well as their inference cost: GPT-4o, 4.1, 4.1-mini, 5, 5-mini, o3, and o4-mini (model versions are provided in Appendix S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). For reasoning models (ie, GPT-5, 5-mini, o3, and o4-mini), the reasoning effort parameter was set to high. We compared their precision and recall with those of the RBS, evaluated performance (precision, recall, and <italic>F</italic><sub>1</sub>-scores), and conducted error analysis to understand model limitations and performance variability.</p>
        </sec>
        <sec>
          <title>Zero-Shot Prompting</title>
          <p>State-of-the-art LLMs are instruction-tuned on diverse tasks [<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref49">49</xref>], enabling them to follow novel instructions and perform unseen tasks without requiring additional training, a capability known as zero-shot generalization [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref51">51</xref>]. Prior studies have highlighted the importance of systematic prompt engineering [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref52">52</xref>], for example, by incorporating annotation guideline instructions. As shown in Figure S2 and Appendix S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, our zero-shot approach used a 3-component system prompt: (1) role-playing instructions to contextualize the task, (2) definitions of SDoH domain categories and subcategories, and (3) step-by-step instructions for extracting SDoH information and structuring the output. The prompt instructed LLMs to follow a hierarchical approach: identify SDoH domain categories first, then their corresponding subcategories, returning “none” if no relevant information was present. We emphasized that only current, patient-specific, and confirmed SDoH information should be extracted, excluding historical, family member, or hypothetical mentions (eg, doctor’s recommendations).</p>
          <p>In addition, we evaluated 3 prompting styles, namely, strict, balanced, and liberal, which differ in their threshold for identifying SDoH domains and subcategories (inclusion criteria). The strict style requires explicit evidence, balanced accepts evidence that is strongly implied, and liberal takes the most inclusive approach, accepting not only explicit and strongly implied evidence but also information deemed reasonably likely from the context. We hypothesized that these styles would demonstrate a precision-recall trade-off, with strict achieving higher precision and liberal yielding higher recall.</p>
        </sec>
        <sec>
          <title>Few-Shot Prompting</title>
          <p>Following Consoli et al [<xref ref-type="bibr" rid="ref14">14</xref>], we tested 6 few-shot prompting strategies using examples from our annotation training: (1) using 5 examples where annotators readily agreed on the correct identification of SDoH information (ie, easy examples); (2) same as (1), but with explanations describing the reasoning behind each annotation; (3) using 5 challenging examples that required annotator adjudication (ie, hard examples); (4) same as (3), but with explanations added; (5) using synthetically generated examples by GPT; and (6) same as (5), but with synthetic explanations. The goal of these experiments was to assess whether advanced GPT models benefit from examples with or without explanations, and whether exposure to difficult, ambiguous, or synthetic cases improves their accuracy and robustness in SDoH extraction. The few-shot prompt structure is illustrated in Figure S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        </sec>
      </sec>
      <sec>
        <title>RBS-GPT Ensemble</title>
        <p>Drawing on prior work in LLM ensemble learning within the broader NLP domain [<xref ref-type="bibr" rid="ref53">53</xref>-<xref ref-type="bibr" rid="ref56">56</xref>], we implemented a hybrid ensemble approach that aggregates rule-based and GPT model outputs using late fusion to improve the overall performance of SDoH extraction. Using the annotator training samples as development data, we found that the RBS achieved good precision (0.92) for domain categories but showed poor performance (precision of 0.64) at the subcategory level. Based on these findings, we designed 2 different ensemble strategies (<xref rid="figure4" ref-type="fig">Figure 4</xref>): (1) for domain categories, we deployed the best-performing GPT model with 3 prompting styles (strict, balanced, and liberal) to form a small “GPT committee.” The committee’s outputs were first aggregated and then combined with those from the RBS; (2) for subcategories, we used only the aggregated GPT committee output to determine the final list of SDoH subcategories. We evaluated several ensemble configurations, testing 3 fusion functions for the GPT committee: (1) majority voting, (2) union, and (3) intersection, and compared them with GPT using strict prompting alone. We also examined 2 fusion functions (union and intersection) for combining RBS and GPT committee outputs (RBS-GPT fusion).</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>(A) Overview of the RBS-GPT ensemble workflow, illustrating separate fusion pathways for SDoH domain categories and subcategories. For domain categories, outputs from the RBS and multiple GPT prompts (the GPT committee) are combined using late fusion. For subcategories, only outputs from the GPT committee are aggregated. (B) Illustrative example of the fusion strategies, including majority voting, union, and intersection. RBS: rule-based system; SDoH: social determinants of health.</p>
          </caption>
          <graphic xlink:href="medinform_v14i1e89534_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Gold-Standard Data Annotation</title>
        <p>The final annotated validation dataset consisted of 226 text segments from 171 patients, with a total of 410 SDoH domain-category annotations, including 7 labeled “none of the above,” and 475 subcategory annotations, including 153 labeled “N/A.” <xref ref-type="table" rid="table1">Table 1</xref> summarizes patient demographic characteristics, showing balanced distributions of gender and self-reported race, with a predominance of older patients and those with public health insurance.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Patient demographics from the annotated validation dataset (N=171).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="650"/>
            <col width="320"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Characteristics and categories</td>
                <td>Value, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>Age group (years)</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#60;25</td>
                <td>16 (9.4)</td>
              </tr>
              <tr valign="top">
                <td/>
                <td>25-44</td>
                <td>39 (22.8)</td>
              </tr>
              <tr valign="top">
                <td/>
                <td>45-64</td>
                <td>31 (18.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥65</td>
                <td>85 (49.7)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Gender</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td>86 (50.3)</td>
              </tr>
              <tr valign="top">
                <td/>
                <td>Male</td>
                <td>85 (49.7)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Self-reported race</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Asian</td>
                <td>38 (22.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Black/African American</td>
                <td>46 (26.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>White</td>
                <td>43 (25.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other</td>
                <td>44 (25.7)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Ethnicity</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hispanic</td>
                <td>17 (9.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Non-Hispanic</td>
                <td>154 (90.1)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Marital status</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Single</td>
                <td>84 (49.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Married</td>
                <td>62 (36.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Partner</td>
                <td>1 (0.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Divorced</td>
                <td>11 (6.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Separated</td>
                <td>2 (1.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Widowed</td>
                <td>5 (2.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other/unknown</td>
                <td>6 (3.5)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Income level<sup>a</sup></bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#60;US $40,000</td>
                <td>17 (9.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>US $40,000–69,000</td>
                <td>88 (51.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>US $70,000–99,000</td>
                <td>46 (26.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥US $100,000</td>
                <td>17 (9.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unknown</td>
                <td>3 (1.8)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Public payer</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td>122 (71.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No</td>
                <td>49 (28.7)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Veteran status</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td>4 (2.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No</td>
                <td>152 (88.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unknown</td>
                <td>15 (8.8)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Median household income by ZIP code.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>As noted earlier, the 2 annotators achieved strong interannotator agreement (Krippendorff α=.95 for domain categories and .78 for subcategories with attributes). The majority of annotation disagreements for domain categories were attributed to “social resources” (which required a clearer scope definition) and “general financial status” (where 1 annotator [DK] overlooked questionnaire-derived mentions). Similarly, most subcategory-level disagreements stemmed from poorly formatted in-text questionnaires and inconsistencies in identifying contextual attributes of SDoH mentions. For instance, references to public housing applications prompted discussion about whether they should be labeled as “hypothetical” under “subsidized/public housing.” Additionally, annotators needed further guidance to correctly parse question-answer pairs within poorly formatted questionnaire text. Only text segments containing current, patient-specific, and nonhypothetical SDoH information were considered SDoH-positive cases.</p>
      </sec>
      <sec>
        <title>Model Performance</title>
        <sec>
          <title>Comparative Performance of Rule-Based and GPT Models for SDoH Classification</title>
          <p><xref rid="figure5" ref-type="fig">Figure 5</xref> summarizes the macro-averaged performance of the RBS and 5 GPT-based models (additional results in Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>); 95% CIs for macro- and micro-averaged <italic>F</italic><sub>1</sub>-scores are shown in Figures S4 and S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. While the RBS achieved high precision for domain categories, it demonstrated substantially lower recall than GPT-based models across both classification levels, highlighting the inherent limitation of fixed rules. By contrast, GPT-based models consistently outperformed the RBS in recall and <italic>F</italic><sub>1</sub>-scores. At the domain-category level, GPT-5-mini (5-shot) and GPT-5 (5-shot) were tied for the highest point-estimate <italic>F</italic><sub>1</sub>-score (0.89), with precision/recall/<italic>F</italic><sub>1</sub>-score of 0.91/0.87/0.89 (95% CI for <italic>F</italic><sub>1</sub>-score 0.86-0.91) and 0.96/0.84/0.89 (95% CI for <italic>F</italic><sub>1</sub>-score 0.86-0.92), respectively. At the subcategory level, the o4-mini models demonstrated the strongest performance, achieving an <italic>F</italic><sub>1</sub>-score of 0.87 (95% CI 0.83-0.90) in the zero-shot setting (precision, recall, and <italic>F</italic><sub>1</sub>-score of 0.85, 0.91, and 0.87, respectively) and 0.88 (95% CI 0.84-0.91) in the 5-shot setting (0.90, 0.87, and 0.88, respectively). As shown in Figure S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, the 95% CIs overlapped considerably between o4-mini and GPT-5, suggesting that small differences in point estimates should be interpreted cautiously. Overall, few-shot prompting yielded modest gains in precision for subcategories, often accompanied by slight reductions in recall. <xref ref-type="table" rid="table2">Table 2</xref> reports micro-averaged metrics and absolute error counts (false positives and false negatives) for subcategories (additional results in Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Consistent with the macro-averaged results, o4-mini remained the best overall subcategory model, with o4-mini (5-shot) achieving the highest micro-averaged <italic>F</italic><sub>1</sub>-score (0.88; 95% CI 0.85-0.91; true positive, false positive, and false negative of 283, 37, and 39, respectively). GPT-5-mini (zero-shot) achieved the highest recall (0.93) and the largest number of true positives (298), but at the cost of more false positives (100).</p>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>Overall performance comparison between rule-based system (RBS) and GPT-based approaches. Macro-averaged precision, recall, and <italic>F</italic><sub>1</sub>-score are reported separately for domain categories and subcategories. The corresponding 95% CIs for macro-<italic>F</italic><sub>1</sub>-score are shown in Figures S4 and S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. All reasoning models reported here (o4-mini, GPT-5-mini, and GPT-5) were run using the high-reasoning setting. The highest score in each metric column is highlighted with a blue box border. SDoH: social determinants of health.</p>
            </caption>
            <graphic xlink:href="medinform_v14i1e89534_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Micro-averaged performance metrics and absolute error counts for subcategories<sup>a,b</sup>.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="200"/>
              <col width="100"/>
              <col width="90"/>
              <col width="90"/>
              <col width="170"/>
              <col width="150"/>
              <col width="200"/>
              <thead>
                <tr valign="top">
                  <td>Models</td>
                  <td>Precision</td>
                  <td>Recall</td>
                  <td><italic>F</italic><sub>1</sub>-score</td>
                  <td>True positive, n</td>
                  <td>False positive, n</td>
                  <td>False negative, n</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Rule-based system</td>
                  <td>0.67</td>
                  <td>0.49</td>
                  <td>0.57</td>
                  <td>159</td>
                  <td>79</td>
                  <td>163</td>
                </tr>
                <tr valign="top">
                  <td>GPT-4o (zero-shot)</td>
                  <td>0.77</td>
                  <td>0.85</td>
                  <td>0.81</td>
                  <td>274</td>
                  <td>83</td>
                  <td>48</td>
                </tr>
                <tr valign="top">
                  <td>GPT-4o (5-shot)</td>
                  <td>0.82</td>
                  <td>0.84</td>
                  <td>0.83</td>
                  <td>272</td>
                  <td>58</td>
                  <td>50</td>
                </tr>
                <tr valign="top">
                  <td>GPT-4.1 (zero-shot)</td>
                  <td>0.79</td>
                  <td>0.85</td>
                  <td>0.82</td>
                  <td>275</td>
                  <td>75</td>
                  <td>47</td>
                </tr>
                <tr valign="top">
                  <td>GPT-4.1 (5-shot)</td>
                  <td>0.84</td>
                  <td>0.83</td>
                  <td>0.83</td>
                  <td>266</td>
                  <td>50</td>
                  <td>56</td>
                </tr>
                <tr valign="top">
                  <td>o4-mini (zero-shot)</td>
                  <td>0.84</td>
                  <td>0.90</td>
                  <td>0.87</td>
                  <td>289</td>
                  <td>55</td>
                  <td>33</td>
                </tr>
                <tr valign="top">
                  <td>o4-mini (5-shot)</td>
                  <td>0.88</td>
                  <td>0.88</td>
                  <td>0.88</td>
                  <td>283</td>
                  <td>37</td>
                  <td>39</td>
                </tr>
                <tr valign="top">
                  <td>GPT-5-mini (zero-shot)</td>
                  <td>0.75</td>
                  <td>0.93</td>
                  <td>0.83</td>
                  <td>298</td>
                  <td>100</td>
                  <td>24</td>
                </tr>
                <tr valign="top">
                  <td>GPT-5-mini (5-shot)</td>
                  <td>0.79</td>
                  <td>0.90</td>
                  <td>0.84</td>
                  <td>289</td>
                  <td>78</td>
                  <td>33</td>
                </tr>
                <tr valign="top">
                  <td>GPT-5 (zero-shot)</td>
                  <td>0.84</td>
                  <td>0.88</td>
                  <td>0.86</td>
                  <td>282</td>
                  <td>54</td>
                  <td>40</td>
                </tr>
                <tr valign="top">
                  <td>GPT-5 (5-shot)</td>
                  <td>0.88</td>
                  <td>0.84</td>
                  <td>0.86</td>
                  <td>272</td>
                  <td>37</td>
                  <td>50</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table2fn1">
                <p><sup>a</sup>Absolute counts denote true positives, false positives, and false negatives relative to gold-standard annotations.</p>
              </fn>
              <fn id="table2fn2">
                <p><sup>b</sup>True positive + false negative sums to 322 rather than the 475 total annotations because 153 annotations labeled “NA” do not contribute to true positive or false negative for any positive subcategory label.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <p>Appendix S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> benchmarks the inference time (client wall-clock) and cost across o4-mini, GPT-5-mini, and GPT-5 under a high-reasoning setting, using a single-worker sequential deployment. While both mini models performed competitively with GPT-5, they demonstrated substantially lower inference latency and estimated per-segment cost. For example, o4-mini required approximately 7.0 seconds per segment in zero-shot and 8.9 seconds in 5-shot prompting, compared with 33.0 and 34.6 seconds, respectively, for GPT-5. API-reported reasoning tokens accounted for most completion tokens across models (94%-98%; see Appendix S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), reflecting the computational overhead of chain-of-thought processing. Based on cost efficiency and competitive performance at both levels, as demonstrated in the per-domain and per-subcategory results (Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), we selected o4-mini (5-shot) as our primary model for further experiments involving ensemble modeling.</p>
        </sec>
        <sec>
          <title>Prompting Comparison</title>
          <p>Among the strict, balanced, and liberal prompting styles, we observed the anticipated precision-recall trade-off (Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>): strict prompting achieved the highest precision and <italic>F</italic><sub>1</sub>-scores for subcategories in both zero-shot and 5-shot settings, while liberal prompting had the best recall, and balanced prompting yielded intermediate results.</p>
          <p>Performance varied modestly across example types (easy, hard, or synthetic), with <italic>F</italic><sub>1</sub>-scores ranging from 0.81 to 0.86 for domain categories and 0.87 to 0.88 for subcategories (Table S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Hard examples requiring annotator adjudication yielded better performance for subcategories, particularly in precision (0.90 vs 0.86 for easy examples and 0.88 for synthetic examples). Adding explanations to the prompt improved precision for subcategories in the hard-example model (from 0.88 to 0.90) but had little impact on other models or metrics.</p>
        </sec>
        <sec>
          <title>Ensemble Performance</title>
          <p>As described in the “Methods” section, we used different ensemble strategies by classification level: 2-step fusion for domain categories and GPT-committee ensembling for subcategories. As shown in <xref ref-type="table" rid="table3">Table 3</xref>, majority voting on GPT-committee outputs followed by union (∪) with RBS outputs achieved the highest macro-averaged <italic>F</italic><sub>1</sub>-score (0.92; 95% CI 0.89-0.94) and the most balanced performance for domain categories, with precision above 0.93 and recall above 0.90. However, the overlapping CIs suggest that performance differences among top fusion strategies should be interpreted cautiously. Of the 402 domain-category predictions produced (of which 21 were “none of the above”), 32 (8.0%) were contributed by the RBS alone, demonstrating its added value; 140 (34.8%) came from the GPT committee, indicating its ability to capture patterns missed by the RBS; and the remaining 230 (57.2%) were identified by both systems. For subcategories, the strict-only configuration achieved the best performance (precision of 0.90, recall of 0.87, <italic>F</italic><sub>1</sub>-score=0.88; 95% CI 0.84-0.91), consistent with our objective of maximizing <italic>F</italic><sub>1</sub>-score with balanced precision and recall. The intersection configuration followed closely, achieving an <italic>F</italic><sub>1</sub>-score of 0.87, with higher precision (0.92) but lower recall (0.84). Micro-averaged results and absolute error counts are reported in Table S15 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> and showed a similar overall pattern.</p>
          <table-wrap position="float" id="table3">
            <label>Table 3</label>
            <caption>
              <p>Performance of ensemble models across fusion strategies<sup>a,b</sup>.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="210"/>
              <col width="180"/>
              <col width="200"/>
              <col width="180"/>
              <col width="200"/>
              <thead>
                <tr valign="bottom">
                  <td colspan="2">SDoH<sup>c</sup> label level and GPT-committee</td>
                  <td>RBS<sup>d</sup>-GPT fusion</td>
                  <td>Precision (95% CI)</td>
                  <td>Recall (95% CI)</td>
                  <td><italic>F</italic><sub>1</sub>-score (95% CI)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="2">
                    <bold>Domain categories</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Majority voting</td>
                  <td>∪</td>
                  <td>0.93 (0.90-0.96)</td>
                  <td>0.90 (0.87-0.93)</td>
                  <td><italic>0.92</italic> (0.89-0.94)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Majority voting</td>
                  <td>∩</td>
                  <td><italic>0.99</italic> (0.98-1.00)</td>
                  <td>0.60 (0.55-0.66)</td>
                  <td>0.74 (0.70-0.78)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Union</td>
                  <td>∪</td>
                  <td>0.89 (0.85-0.92)</td>
                  <td><italic>0.93</italic> (0.90-0.96)</td>
                  <td>0.91 (0.88-0.93)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Union</td>
                  <td>∩</td>
                  <td><italic>0.99</italic> (0.97-1.00)</td>
                  <td>0.63 (0.58-0.68)</td>
                  <td>0.76 (0.72-0.80)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Intersection</td>
                  <td>∪</td>
                  <td>0.95 (0.92-0.98)</td>
                  <td>0.85 (0.81-0.89)</td>
                  <td>0.90 (0.87-0.92)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Intersection</td>
                  <td>∩</td>
                  <td><italic>0.99</italic> (0.98-1.00)</td>
                  <td>0.55 (0.49-0.60)</td>
                  <td>0.70 (0.65-0.74)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Strict-only</td>
                  <td>∪</td>
                  <td>0.95 (0.92-0.98)</td>
                  <td>0.88 (0.84-0.91)</td>
                  <td>0.91 (0.88-0.93)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Strict-only</td>
                  <td>∩</td>
                  <td><italic>0.99</italic> (0.98-1.00)</td>
                  <td>0.56 (0.51-0.62)</td>
                  <td>0.71 (0.67-0.76)</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>Subcategories</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Majority voting</td>
                  <td>N/A<sup>e</sup></td>
                  <td>0.85 (0.82-0.89)</td>
                  <td>0.91 (0.87-0.94)</td>
                  <td>0.87 (0.84-0.90)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Union</td>
                  <td>N/A</td>
                  <td>0.73 (0.69-0.78)</td>
                  <td><italic>0.95</italic> (0.92-0.97)</td>
                  <td>0.82 (0.78-0.84)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Intersection</td>
                  <td>N/A</td>
                  <td><italic>0.92</italic> (0.89-0.95)</td>
                  <td>0.84 (0.79-0.88)</td>
                  <td>0.87 (0.83-0.90)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Strict-only</td>
                  <td>N/A</td>
                  <td>0.90 (0.87-0.94)</td>
                  <td>0.87 (0.83-0.91)</td>
                  <td><italic>0.88</italic> (0.84-0.91)</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table3fn1">
                <p><sup>a</sup>Macro-averaged precision, recall, and <italic>F</italic><sub>1</sub>-scores are reported for domain categories and subcategories. Majority voting, union, and intersection denote label assignment by most, any, or all GPT committee members, respectively. Strict-only uses the strict-prompt GPT output without aggregation. For domain categories, ∪ denotes assignment by either RBS or the GPT committee, and ∩ denotes assignment by both. 95% CIs were computed using 2000 patient-level cluster bootstrap resamples.</p>
              </fn>
              <fn id="table3fn2">
                <p><sup>b</sup>The highest scores for each metric (column) are italicized.</p>
              </fn>
              <fn id="table3fn3">
                <p><sup>c</sup>SDoH: social determinants of health.</p>
              </fn>
              <fn id="table3fn4">
                <p><sup>d</sup>RBS: rule-based system.</p>
              </fn>
              <fn id="table3fn5">
                <p><sup>e</sup>For subcategories, RBS-GPT fusion was not applied; N/A (not applicable) indicates GPT-committee ensembling only.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Comparison With International Classification of Diseases (ICD) Codes</title>
          <p>Both the RBS and GPT models identified substantially more SDoH information than documentation based on ICD (International Classification of Diseases) codes (V and Z codes). Of the 226 annotated samples, our RBS identified SDoH information in 225, and the 5-shot GPT models identified SDoH in 194 (o4-mini), 219 (GPT-5-mini), and 206 (GPT-5) cases. In comparison, relevant ICD codes were present in far fewer visits across all 3 time windows examined: using broad Z and V codes (see Table S12 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), matches were found in 84 visits within 7 days of the corresponding clinical documentation, 128 visits within a 6-month lookback window, and 133 visits within a 12-month lookback window. Using SDoH category–specific Z and V codes (see Table S13 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), matches were found in only 11, 12, and 14 visits for the same time windows, respectively. These findings highlight the value of extracting SDoH from clinical text, as structured ICD coding substantially undercaptures SDoH information even when extended lookback periods are used.</p>
        </sec>
        <sec>
          <title>Error Analysis</title>
          <p>To better understand model limitations beyond quantitative performance metrics, we conducted a qualitative review of false-positive and false-negative predictions from the o4-mini (5-shot) model and the RBS at both the domain and subcategory levels. Owing to its lack of semantic understanding, the RBS failed to capture many SDoH mentions that fell outside its predefined keyword rules. For example, it was unable to recognize that “patient owns multiple homes” indicates secure housing. Its finite vocabulary coverage also meant that domain-specific terms such as “Section 8” (a government-funded rent subsidy program) went unrecognized. The majority of the RBS’s false positives stemmed from its failure to correctly recognize negations, temporality, hypotheticals, and experiencer attribution, which were annotated as contextual attributes in our validation data, as well as its inability to perform semantic disambiguation. Table S14 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> summarizes the primary error types for both approaches.</p>
          <p>In contrast to the RBS, o4-mini demonstrated its ability to interpret semantic meaning and generalize beyond keyword matching. However, it exhibited a different set of errors related to reasoning calibration, evidence evaluation, and instruction adherence. These errors can be classified into 4 primary categories (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>).</p>
          <boxed-text id="box1" position="float">
            <title>Error classification.</title>
            <p>1. Missing implicit evidence</p>
            <p>Under the strict prompting style adopted for subsequent analyses, o4-mini at times failed to infer social determinants of health (SDoH) subcategories that were implied but not explicitly stated.</p>
            <p>2. Overinterpretation of insufficient evidence</p>
            <p>Conversely, the model also exhibited over-reasoning, assigning labels when the evidence was directionally relevant but fell short of what the annotation guidelines require.</p>
            <p>3. Prompt instruction nonadherence</p>
            <p>In several cases, the model failed to follow explicit SDoH definitions provided in the prompt.</p>
            <p>4. Temporality misclassification</p>
            <p>The model occasionally correctly identified an SDoH mention but failed to determine whether it reflected the patient’s current or historical status.</p>
          </boxed-text>
          <p>The first 2 error types reflect a gap between the model and human annotators regarding what constitutes sufficient evidence for SDoH classification, suggesting that the model lacks a calibrated threshold aligned with the annotation framework. Future efforts should focus on closing this gap through refined SDoH definitions and boundary-clarifying examples.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This study examined the extraction of SDoH information across 7 domain categories, including less-studied domains such as social resources and health insurance status, and 23 corresponding subcategories from discharge summaries and progress notes in a large health system. We evaluated 7 GPT models under multiple prompting strategies and compared their performance with an expert-designed, iteratively optimized RBS. Recently released GPT models with improved reasoning capabilities, such as GPT-5 and o4-mini, achieved the best overall performance at both the domain category and subcategory levels. While the RBS demonstrated high precision for domain categories, it exhibited consistently low recall because of the inherent rigidity of manually engineered rules. For example, GPT models correctly identified “patient needs WIC” (where WIC refers to the Women, Infants, &#38; Children Nutrition Program) as an indicator of “food insecurity” by recognizing WIC’s role as a food assistance program, while appropriately excluding gastrointestinal-related eating difficulties as medical rather than socioeconomic issues. By contrast, the RBS failed to capture the WIC reference because it relied on predefined lexicons and misclassified gastrointestinal-related eating problems as food insecurity, lacking the semantic understanding to distinguish medical from social determinants. Our findings differ from Patra et al [<xref ref-type="bibr" rid="ref17">17</xref>], who reported superior RBS performance over an LLM-based approach for classifying social support and social isolation, primarily because their RBS closely mirrored the gold-standard annotation rule book, leading to overfitting.</p>
        <p>Focusing on our GPT models, the domain-level macro-<italic>F</italic><sub>1</sub>-scores of 0.82-0.89 are broadly consistent with recent evaluations of LLM-based SDoH extraction [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. For example, Keloth et al [<xref ref-type="bibr" rid="ref15">15</xref>] reported macro-<italic>F</italic><sub>1</sub>-scores ranging from 0.53 to 0.84 across 4 institutions using instruction fine-tuned LLaMA models, while Guevara et al [<xref ref-type="bibr" rid="ref13">13</xref>] achieved a macro-<italic>F</italic><sub>1</sub>-score of 0.71 for sentence-level SDoH classification using fine-tuned Flan-T5 models. At the subcategory level, our GPT models achieved macro-<italic>F</italic><sub>1</sub>-scores of 0.78-0.88 across 23 subcategories. By contrast, Keloth et al [<xref ref-type="bibr" rid="ref15">15</xref>] reported lower level-2 macro-<italic>F</italic><sub>1</sub>-scores (0.45-0.59), although their task additionally required temporality determination for some categories. Earlier-generation LLMs have shown more limited in-context learning performance, with GPT-4 one-shot prompting achieving only 0.65 micro-averaged <italic>F</italic><sub>1</sub>-score on the n2c2/UW SHAC event extraction task [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref57">57</xref>], and few-shot–prompted LLaMA-2 underperforming fine-tuned models [<xref ref-type="bibr" rid="ref15">15</xref>]. While these comparisons should be interpreted with caution because of differences in SDoH taxonomies, annotation schemas, note types, evaluation metrics, and the enriched nature of our validation set, the overall pattern suggests that recent reasoning-capable GPT models, when applied to prescreened clinical text in prompted settings, can achieve performance comparable to that reported for fine-tuned approaches and represent a meaningful advance over earlier LLM prompting-based models. Additional evaluation on 500 unfiltered text segments, drawn from notes with a median documentation year of 2014 (IQR 2010-2018), showed low false-positive rates and provided preliminary evidence that the model can identify SDoH concepts in unfiltered clinical text, although the small number of SDoH-positive cases (n=42) precludes definitive conclusions about broader generalizability (see Appendix S7 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
        <p>Comparing efficiency in model development, GPT-based approaches in zero-shot or few-shot settings required substantially less development time and cost than constructing the RBS, which involved iterative rule creation and refinement. Among the GPT models, newer “mini” models, such as GPT-5-mini and o4-mini, which retain reasoning capabilities, performed competitively with OpenAI’s flagship GPT-5 model while demonstrating substantially lower inference costs and latency. In our benchmarking (Appendix S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), o4-mini (5-shot) and GPT-5-mini (5-shot) incurred estimated costs of US $0.008 and US $0.005 per text segment, respectively, compared with US $0.029 for GPT-5 (5-shot), representing 72%-82% cost reductions. By contrast, earlier small models such as GPT-4o-mini and GPT-4.1-mini, although offering even lower per-token pricing, did not perform on par with their respective full models. At the observed single-worker throughput for o4-mini (5-shot), processing 100,000 and 1,000,000 segments would require approximately 10 and 102 days, respectively. In practice, cloud providers offer asynchronous batch processing with higher rate-limit pools and a 50% cost discount, which could substantially reduce wall-clock time relative to sequential single-worker deployment. However, realized throughput remains subject to API quotas, particularly for reasoning models such as o4-mini, whose hidden reasoning tokens increase token consumption. Alternatively, LLM-generated annotations on a representative subset could be used to train a local classifier, reducing API dependence for large-scale deployment.</p>
        <p>Our prompt engineering evaluation highlighted the sensitivity of model performance to prompt wording, showing a precision-recall trade-off that can be tuned through stricter or more liberal prompt styles. For few-shot prompting, when comparing the addition of different types of examples, we found that including cases in which annotators required clarification or adjudication, along with explanations, yielded optimal performance for SDoH subcategories, suggesting the value of exposing LLMs to examples that humans themselves found challenging and ambiguous. For example, to improve GPT models’ ability to parse questionnaire text, we provided examples demonstrating how to identify question-answer pairs and when to recognize missing answers, in which case no subcategory should be assigned. Taken together, these findings suggest that adopting a systematic approach to prompt design and incorporating challenging examples should be considered best practices for LLM-based extraction methods.</p>
        <p>Lastly, we evaluated various model ensemble strategies using late fusion. Combining the RBS with a committee of GPT models employing different prompting styles improved domain-category extraction compared with using GPT models alone. For example, the RBS-GPT hybrid correctly recognized “involved in church community” as a mention of “social resource,” whereas the GPT models alone failed to do so. For subcategories, the GPT committee demonstrated that precision or recall could be selectively improved depending on the fusion function applied, though without an overall performance gain. These findings suggest the complementary strengths of rule- and LLM-based systems, although the contribution of the RBS to the ensemble for domain category extraction may be inflated by the keyword-enriched validation set. The lack of improvement at the subcategory level also indicates the need for more advanced and adaptive ensemble strategies, such as mixture-of-experts approaches in which different models (experts) handle different inputs, a direction for future investigation.</p>
      </sec>
      <sec>
        <title>Limitations and Future Directions</title>
        <p>This study has several limitations. First, both our RBS and GPT-based models were validated in a single health care system, and performance may vary elsewhere depending on documentation practices. This concern may be particularly relevant for the RBS, whose lexicon was filtered and refined through manual review of MGB notes and may therefore be less generalizable to other health systems. Additionally, because the validation set was sampled from the same source corpus, the reported RBS performance may represent an optimistic upper bound in this setting. At the same time, MGB comprises more than 8 hospitals and multiple community health centers with heterogeneous catchment areas and clinical practices, supporting some degree of generalizability. Second, our primary goal was to develop a cost-efficient SDoH extraction pipeline for resource-constrained settings, which motivated our focus on rule-based and LLM prompting–based approaches that can be deployed with minimal annotation effort and computational resources. We did not explore the use of synthetic data generation for training supervised models or LLM fine-tuning, which, while potentially reducing annotation cost, still requires computation for model training. Future work could examine how these approaches compare. Third, although recent GPT models are considered state of the art for many tasks, particularly those requiring reasoning capabilities, we did not conduct a systematic comparison with open-weight LLMs. Such an evaluation would provide a more complete performance assessment. Fourth, we annotated text segments rather than entire clinical notes, as manual review suggested that segments contained sufficient information for SDoH extraction. However, this approach may miss SDoH mentions that depend on long-distance context within full notes. Fifth, although exploratory analyses stratified by gender, self-reported race, and ethnicity did not detect statistically significant performance differences across demographic subgroups for o4-mini or the RBS (see Appendix S6 and Tables S6-S11 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), small subgroup sizes substantially limited statistical power. These results should not be interpreted as evidence that the models are free of demographic bias, and a larger, more demographically balanced dataset is needed for robust subgroup evaluation. Finally, because we applied rule-based filtering during data sampling, the recall and <italic>F</italic><sub>1</sub>-scores reported from our primary validation set are based on enriched text and therefore do not fully reflect performance in the general population of clinical notes. Although an additional evaluation on 500 unfiltered text segments (Appendix S7 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) suggested that model performance generalizes beyond the enriched setting, the limited number of SDoH-positive cases in unfiltered text prevents definitive conclusions about generalizability and warrants further validation on larger, independently sampled datasets.</p>
        <p>The ability to accurately and efficiently extract SDoH factors from clinical notes has important implications for health care systems, as such information is often underdocumented in structured EHR data. Our approach provides a cost-efficient method for SDoH extraction, demonstrating consistently high precision and recall across both domain categories and subcategories. By prescreening clinical notes with a rule-based NLP filter to identify relevant text segments before applying LLM-based extraction, we improved efficiency and substantially reduced computational costs compared with processing entire patient notes directly with LLMs. The approach presented in this study has the potential to advance important population health research and ultimately inform clinical outcomes and evidence-based policy intervention [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref58">58</xref>]. Incorporating SDoH information into clinical prediction models is expected to improve prediction performance, as recent studies suggest [<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>], while also supporting audits of algorithmic biases beyond traditional demographic variables [<xref ref-type="bibr" rid="ref61">61</xref>]. Finally, as interest grows in implementing such NLP systems in clinical operations, it will be critical to anticipate and mitigate potential unintended consequences of automated SDoH extraction for patients [<xref ref-type="bibr" rid="ref62">62</xref>].</p>
        <p>Future work should assess the robustness and generalizability of our approach to other health care systems, especially those with very different clinical settings, patient demographics, and socioeconomic environments. Furthermore, social determinants are highly context-dependent. Existing models often categorize a patient’s social circumstances into predefined labels without capturing context, limiting their ability to provide a comprehensive and contextually relevant understanding of the patient’s social needs. Lybarger et al [<xref ref-type="bibr" rid="ref21">21</xref>] used an event-based annotation scheme characterizing each SDoH mention with multiple arguments (eg, employment status, duration, history, and type for “employment”) from the social history sections. We plan to explore methods for incorporating richer contextual information, moving beyond the contextual attributes used in our rule-based approach and related work [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. We will investigate text summarization methods to generate structured representations that encapsulate a comprehensive profile of a patient’s SDoH status for each clinical encounter. Lastly, it will also be important to validate the utility of the extracted SDoH information, along with community-level socioeconomic factors [<xref ref-type="bibr" rid="ref58">58</xref>], in supporting downstream health research applications, including suicide prediction [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref63">63</xref>] and model auditing [<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref64">64</xref>].</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study presented and compared 2 NLP approaches, an RBS and a GPT-based model, for extracting SDoH information from clinical text segments retrieved from clinical notes. Recent GPT models with advanced reasoning capabilities achieved superior performance in identifying 7 SDoH domain categories and 23 subcategories with high precision and recall, requiring no additional training or fine-tuning. In addition, we developed and validated late-fusion ensembles combining both approaches to optimize extraction performance. By making our code and prompts available to the scientific community, we provide a cost-efficient solution for accurate SDoH extraction, with the potential to advance important downstream health research applications.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Supplementary materials.</p>
        <media xlink:href="medinform_v14i1e89534_app1.docx" xlink:title="DOCX File , 7266 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BERT</term>
          <def>
            <p>Bidirectional Encoder Representations from Transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">FLAN-T5</term>
          <def>
            <p>Fine-Tuned Language Net—Text-to-Text Transfer Transformer</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">HIPAA</term>
          <def>
            <p>Health Insurance Portability and Accountability Act</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">ICD</term>
          <def>
            <p>International Classification of Diseases</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">LLaMA</term>
          <def>
            <p>Large Language Model Meta AI</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">MGB</term>
          <def>
            <p>Mass General Brigham</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">RBS</term>
          <def>
            <p>rule-based system</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">RPDR</term>
          <def>
            <p>Research Patient Data Registry</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">SDoH</term>
          <def>
            <p>social determinants of health</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">UMLS</term>
          <def>
            <p>Unified Medical Language System</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">WIC</term>
          <def>
            <p>Women, Infants, &#38; Children Nutrition Program</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We declare the use of the generative artificial intelligence tool ChatGPT (OpenAI) for language editing and formatting of the manuscript.</p>
    </ack>
    <notes>
      <title>Data Availability</title>
      <p>Protected Health Information restrictions apply to the availability of the clinical data used here, which were accessed under IRB approval for use only in this study. As a result, this dataset is not publicly available. The code for our rule-based system and LLM prompts is available online [<xref ref-type="bibr" rid="ref45">45</xref>].</p>
    </notes>
    <notes>
      <title>Funding</title>
      <p>This work was supported in part by funding from the Brain and Behavior Research Foundation Young Investigator Award (BW) and the NIMH (grants P50MH129699, R01MH118233, and R01MH137218 to JWS, and K08MH127413 to KWC).</p>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>Conceptualization: BW, KWC, JWS</p>
        <p>Data curation: BW, DK</p>
        <p>Formal analysis: BW</p>
        <p>Funding acquisition: BW, JWS</p>
        <p>Investigation: BW, KWC, JWS</p>
        <p>Methodology: BW, KWC, JWS, DK, CRC</p>
        <p>Project administration: BW</p>
        <p>Resources: KWC, JWS</p>
        <p>Supervision: KWC, JWS</p>
        <p>Validation: BW, DK</p>
        <p>Visualization: BW</p>
        <p>Writing – original draft: BW</p>
        <p>Writing – review &#38; editing: BW, DK, CRC, KWC, JWS</p>
      </fn>
      <fn fn-type="conflict">
        <p>JWS reports grants from Biogen, Inc, and serves as a scientific advisory board member with options from Sensorium Therapeutics, Inc, outside the submitted work. KWC is a paid consultant and a member of the Mind Advisory Committee of Sword Health. No other disclosures were reported.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <article-title>Social determinants of health</article-title>
          <source>World Health Organization (WHO)</source>
          <access-date>2024-02-21</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/health-topics/social-determinants-of-health">https://www.who.int/health-topics/social-determinants-of-health</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Patra</surname>
              <given-names>BG</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Vekaria</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Adekkanattu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>OV</given-names>
            </name>
            <name name-style="western">
              <surname>Glicksberg</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lepow</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Ryu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Biernacka</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Furmanchuk</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>George</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hogan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Weissman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wickramaratne</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mann</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Olfson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Campion</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Weiner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pathak</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Extracting social determinants of health from electronic health records using natural language processing: a systematic review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2021</year>
          <month>11</month>
          <day>25</day>
          <volume>28</volume>
          <issue>12</issue>
          <fpage>2716</fpage>
          <lpage>2727</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34613399"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocab170</pub-id>
          <pub-id pub-id-type="medline">34613399</pub-id>
          <pub-id pub-id-type="pii">6382241</pub-id>
          <pub-id pub-id-type="pmcid">PMC8633615</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Han</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>RF</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Richie</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tseng</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Quan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Brent</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tsui</surname>
              <given-names>FR</given-names>
            </name>
          </person-group>
          <article-title>Classifying social determinants of health from unstructured electronic health records using deep learning-based natural language processing</article-title>
          <source>J Biomed Inform</source>
          <year>2022</year>
          <month>03</month>
          <volume>127</volume>
          <fpage>103984</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(21)00313-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103984</pub-id>
          <pub-id pub-id-type="medline">35007754</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00313-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mehta</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lyles</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Rubinsky</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Kemper</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Auerbach</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sarkar</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Gottlieb</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Brown Iii</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Social determinants of health documentation in structured and unstructured clinical data of patients with diabetes: comparative analysis</article-title>
          <source>JMIR Med Inform</source>
          <year>2023</year>
          <month>08</month>
          <day>22</day>
          <volume>11</volume>
          <fpage>e46159</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2023//e46159/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/46159</pub-id>
          <pub-id pub-id-type="medline">37621203</pub-id>
          <pub-id pub-id-type="pii">v11i1e46159</pub-id>
          <pub-id pub-id-type="pmcid">PMC10466443</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kelley</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gawron</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Montgomery</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Byrne</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Suo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pettey</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>ReHouSED: a novel measurement of Veteran housing stability using natural language processing</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <month>10</month>
          <volume>122</volume>
          <fpage>103903</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(21)00232-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103903</pub-id>
          <pub-id pub-id-type="medline">34474188</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00232-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC8608249</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bejan</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Angiolillo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Conway</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nash</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shirey-Rice</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Lipworth</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cronin</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Pulley</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kripalani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Barkin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Mining 100 million notes to find homelessness and adverse childhood experiences: 2 case studies of rare and severe social determinants of health in electronic health records</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2018</year>
          <month>01</month>
          <day>01</day>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>61</fpage>
          <lpage>71</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29016793"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocx059</pub-id>
          <pub-id pub-id-type="medline">29016793</pub-id>
          <pub-id pub-id-type="pii">3940211</pub-id>
          <pub-id pub-id-type="pmcid">PMC6080810</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Conway</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Keyhani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Christensen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>South</surname>
              <given-names>BR</given-names>
            </name>
            <name name-style="western">
              <surname>Vali</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Walter</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Mowery</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Abdelrahman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>WW</given-names>
            </name>
          </person-group>
          <article-title>Moonstone: a novel natural language processing system for inferring social risk from clinical narratives</article-title>
          <source>J Biomed Semantics</source>
          <year>2019</year>
          <month>04</month>
          <day>11</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>6</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jbiomedsem.biomedcentral.com/articles/10.1186/s13326-019-0198-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13326-019-0198-0</pub-id>
          <pub-id pub-id-type="medline">30975223</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13326-019-0198-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6458709</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>VJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lenert</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Bunnell</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Obeid</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Jefferson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Halbert</surname>
              <given-names>CH</given-names>
            </name>
          </person-group>
          <article-title>Automatically identifying social isolation from clinical narratives for patients with prostate cancer</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2019</year>
          <month>03</month>
          <day>14</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>43</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-019-0795-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-019-0795-y</pub-id>
          <pub-id pub-id-type="medline">30871518</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-019-0795-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC6416852</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mitra</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pradhan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Melamed</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hoaglin</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Tucker</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Reisman</surname>
              <given-names>JI</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Associations between natural language processing-enriched social determinants of health and suicide death among US Veterans</article-title>
          <source>JAMA Netw Open</source>
          <year>2023</year>
          <month>03</month>
          <day>01</day>
          <volume>6</volume>
          <issue>3</issue>
          <fpage>e233079</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36920391"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.3079</pub-id>
          <pub-id pub-id-type="medline">36920391</pub-id>
          <pub-id pub-id-type="pii">2802468</pub-id>
          <pub-id pub-id-type="pmcid">PMC10018322</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Romanowski</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ben Abacha</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Extracting social determinants of health from clinical note text with classification and sequence-to-sequence approaches</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2023</year>
          <month>07</month>
          <day>19</day>
          <volume>30</volume>
          <issue>8</issue>
          <fpage>1448</fpage>
          <lpage>1455</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37100768"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocad071</pub-id>
          <pub-id pub-id-type="medline">37100768</pub-id>
          <pub-id pub-id-type="pii">7143737</pub-id>
          <pub-id pub-id-type="pmcid">PMC10354779</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Shao</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Carducci</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Brufau</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Desai</surname>
              <given-names>RJ</given-names>
            </name>
          </person-group>
          <article-title>Scalable information extraction from free text electronic health records using large language models</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2025</year>
          <month>01</month>
          <day>28</day>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>23</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/s12874-025-02470-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12874-025-02470-z</pub-id>
          <pub-id pub-id-type="medline">39871166</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12874-025-02470-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC11773977</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gabriel</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Litake</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Simpson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Burton</surname>
              <given-names>BN</given-names>
            </name>
            <name name-style="western">
              <surname>Waterman</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Macias</surname>
              <given-names>AA</given-names>
            </name>
          </person-group>
          <article-title>On the development and validation of large language model-based classifiers for identifying social determinants of health</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2024</year>
          <month>09</month>
          <day>24</day>
          <volume>121</volume>
          <issue>39</issue>
          <fpage>e2320716121</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.pnas.org/doi/10.1073/pnas.2320716121?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.2320716121</pub-id>
          <pub-id pub-id-type="medline">39284061</pub-id>
          <pub-id pub-id-type="pmcid">PMC11441499</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guevara</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chaunzwa</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Franco</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Kann</surname>
              <given-names>BH</given-names>
            </name>
            <name name-style="western">
              <surname>Moningi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Harper</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Aerts</surname>
              <given-names>HJWL</given-names>
            </name>
            <name name-style="western">
              <surname>Catalano</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>GK</given-names>
            </name>
            <name name-style="western">
              <surname>Mak</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Bitterman</surname>
              <given-names>DS</given-names>
            </name>
          </person-group>
          <article-title>Large language models to identify social determinants of health in electronic health records</article-title>
          <source>NPJ Digit Med</source>
          <year>2024</year>
          <month>01</month>
          <day>11</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>6</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-023-00970-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-023-00970-0</pub-id>
          <pub-id pub-id-type="medline">38200151</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-023-00970-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC10781957</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Consoli</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rousseau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hartvigsen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Long</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>SDoH-GPT: using large language models to extract social determinants of health</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2026</year>
          <month>01</month>
          <day>01</day>
          <volume>33</volume>
          <issue>1</issue>
          <fpage>67</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocaf094</pub-id>
          <pub-id pub-id-type="medline">40493530</pub-id>
          <pub-id pub-id-type="pii">8159915</pub-id>
          <pub-id pub-id-type="pmcid">PMC12758468</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Keloth</surname>
              <given-names>VK</given-names>
            </name>
            <name name-style="western">
              <surname>Selek</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Gilman</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Brandt</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Social determinants of health extraction from clinical notes across institutions using large language models</article-title>
          <source>NPJ Digit Med</source>
          <year>2025</year>
          <month>05</month>
          <day>17</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>287</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-025-01645-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-025-01645-8</pub-id>
          <pub-id pub-id-type="medline">40379919</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-025-01645-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC12084648</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Dang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Adekkanattu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Gopal Patra</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Pathak</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lo-Ciganic</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>George</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hogan</surname>
              <given-names>WR</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Identifying social determinants of health from clinical narratives: a study of performance, documentation ratio, and potential bias</article-title>
          <source>J Biomed Inform</source>
          <year>2024</year>
          <month>05</month>
          <day>01</day>
          <volume>153</volume>
          <fpage>104642</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(24)00060-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2024.104642</pub-id>
          <pub-id pub-id-type="medline">38621641</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(24)00060-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC11141428</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Patra</surname>
              <given-names>BG</given-names>
            </name>
            <name name-style="western">
              <surname>Lepow</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Kasi Reddy Jagadeesh Kumar</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Vekaria</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Adekkanattu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Fennessy</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Hynes</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Landi</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Sanchez-Ruiz</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Ryu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Biernacka</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Nadkarni</surname>
              <given-names>GN</given-names>
            </name>
            <name name-style="western">
              <surname>Talati</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Weissman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Olfson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mann</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Charney</surname>
              <given-names>AW</given-names>
            </name>
            <name name-style="western">
              <surname>Pathak</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Extracting social support and social isolation information from clinical psychiatry notes: comparing a rule-based natural language processing system and a large language model</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2025</year>
          <volume>32</volume>
          <issue>1</issue>
          <fpage>218</fpage>
          <lpage>226</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocae260</pub-id>
          <pub-id pub-id-type="medline">39423850</pub-id>
          <pub-id pub-id-type="pii">7826739</pub-id>
          <pub-id pub-id-type="pmcid">PMC11648716</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arora</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hicks</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bowman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Quiñonero-Candela</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tsimpourlas</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Sharman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vallone</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Beutel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Heidecke</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Singhal</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>HealthBench: evaluating large language models towards improved human health</article-title>
          <source>arXiv. Preprint posted online May 13, 2025</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2505.08775"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2505.08775</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moëll</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Farestam</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Beskow</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Swedish medical LLM benchmark: development and evaluation of a framework for assessing large language models in the Swedish medical domain</article-title>
          <source>Front Artif Intell</source>
          <year>2025</year>
          <month>07</month>
          <day>10</day>
          <volume>8</volume>
          <fpage>1557920</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/frai.2025.1557920"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/frai.2025.1557920</pub-id>
          <pub-id pub-id-type="medline">40718621</pub-id>
          <pub-id pub-id-type="pmcid">PMC12290221</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lituiev</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Lacar</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Pak</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Abramowitsch</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>De Marchis</surname>
              <given-names>EH</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>TA</given-names>
            </name>
          </person-group>
          <article-title>Automatic extraction of social determinants of health from medical notes of chronic lower back pain patients</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2023</year>
          <month>07</month>
          <day>19</day>
          <volume>30</volume>
          <issue>8</issue>
          <fpage>1438</fpage>
          <lpage>1447</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37080559"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocad054</pub-id>
          <pub-id pub-id-type="medline">37080559</pub-id>
          <pub-id pub-id-type="pii">7133957</pub-id>
          <pub-id pub-id-type="pmcid">PMC10354762</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lybarger</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yetisgen</surname>
              <given-names>M</given-names>
            </name>
            <collab>Uzuner</collab>
          </person-group>
          <article-title>The 2022 n2c2/UW shared task on extracting social determinants of health</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2023</year>
          <month>07</month>
          <day>19</day>
          <volume>30</volume>
          <issue>8</issue>
          <fpage>1367</fpage>
          <lpage>1378</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36795066"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocad012</pub-id>
          <pub-id pub-id-type="medline">36795066</pub-id>
          <pub-id pub-id-type="pii">7043152</pub-id>
          <pub-id pub-id-type="pmcid">PMC10354764</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nalichowski</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Keogh</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chueh</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SN</given-names>
            </name>
          </person-group>
          <article-title>Calculating the benefits of a Research Patient Data Repository</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2006</year>
          <volume>2006</volume>
          <fpage>1044</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/17238663"/>
          </comment>
          <pub-id pub-id-type="medline">17238663</pub-id>
          <pub-id pub-id-type="pii">85854</pub-id>
          <pub-id pub-id-type="pmcid">PMC1839563</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Karlson</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Boutin</surname>
              <given-names>NT</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffnagle</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>NL</given-names>
            </name>
          </person-group>
          <article-title>Building the Partners HealthCare Biobank at Partners Personalized Medicine: informed consent, return of research results, recruitment lessons and operational considerations</article-title>
          <source>J Pers Med</source>
          <year>2016</year>
          <month>01</month>
          <day>14</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>2</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=jpm6010002"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/jpm6010002</pub-id>
          <pub-id pub-id-type="medline">26784234</pub-id>
          <pub-id pub-id-type="pii">jpm6010002</pub-id>
          <pub-id pub-id-type="pmcid">PMC4810381</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <collab>Institute of Medicine</collab>
          </person-group>
          <source>Capturing Social and Behavioral Domains in Electronic Health Records: Phase 1</source>
          <year>2014</year>
          <publisher-loc>Washington, DC</publisher-loc>
          <publisher-name>National Academies Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <collab>Institute of Medicine</collab>
          </person-group>
          <source>Capturing Social and Behavioral Domains and Measures in Electronic Health Records: Phase 2</source>
          <year>2014</year>
          <publisher-loc>Washington, DC</publisher-loc>
          <publisher-name>National Academies Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hatef</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rouhizadeh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tia</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Lasser</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hill-Briggs</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Marsteller</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kharrazi</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Assessing the availability of data on social and behavioral determinants in structured and unstructured electronic health records: a retrospective analysis of a multilevel health care system</article-title>
          <source>JMIR Med Inform</source>
          <year>2019</year>
          <month>08</month>
          <day>02</day>
          <volume>7</volume>
          <issue>3</issue>
          <fpage>e13802</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2019/3/e13802/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13802</pub-id>
          <pub-id pub-id-type="medline">31376277</pub-id>
          <pub-id pub-id-type="pii">v7i3e13802</pub-id>
          <pub-id pub-id-type="pmcid">PMC6696855</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Botelle</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bhavsar</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Kadra-Scalzo</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Mascio</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>MV</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Velupillai</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Can natural language processing models extract and classify instances of interpersonal violence in mental healthcare electronic records: an applied evaluative study</article-title>
          <source>BMJ Open</source>
          <year>2022</year>
          <month>02</month>
          <day>16</day>
          <volume>12</volume>
          <issue>2</issue>
          <fpage>e052911</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=35172999"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2021-052911</pub-id>
          <pub-id pub-id-type="medline">35172999</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2021-052911</pub-id>
          <pub-id pub-id-type="pmcid">PMC8852656</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
          <source>Label Studio</source>
          <access-date>2026-04-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://labelstud.io/">https://labelstud.io/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krippendorff</surname>
              <given-names>Klaus</given-names>
            </name>
          </person-group>
          <source>Content Analysis: An Introduction to Its Methodology</source>
          <year>2019</year>
          <publisher-loc>Thousand Oaks, CA</publisher-loc>
          <publisher-name>SAGE Publications</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marzi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Balzano</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Marchiori</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>K-alpha calculator–Krippendorff's alpha calculator: a user-friendly tool for computing Krippendorff's alpha inter-rater reliability coefficient</article-title>
          <source>MethodsX</source>
          <year>2024</year>
          <month>06</month>
          <volume>12</volume>
          <fpage>102545</fpage>
          <pub-id pub-id-type="doi">10.1016/j.mex.2023.102545</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eyre</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Alba</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Box</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>DuVall</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>OV</given-names>
            </name>
          </person-group>
          <article-title>Launching into clinical space with medspaCy: a new clinical text processing toolkit in Python</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2021</year>
          <volume>2021</volume>
          <fpage>438</fpage>
          <lpage>447</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35308962"/>
          </comment>
          <pub-id pub-id-type="medline">35308962</pub-id>
          <pub-id pub-id-type="pii">3576697</pub-id>
          <pub-id pub-id-type="pmcid">PMC8861690</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stemerman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Arguello</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Brice</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Krishnamurthy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Houston</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kitzmiller</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Identification of social determinants of health using multi-label classification of electronic health record clinical notes</article-title>
          <source>JAMIA Open</source>
          <year>2021</year>
          <month>07</month>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>ooaa069</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34514351"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamiaopen/ooaa069</pub-id>
          <pub-id pub-id-type="medline">34514351</pub-id>
          <pub-id pub-id-type="pii">ooaa069</pub-id>
          <pub-id pub-id-type="pmcid">PMC8423426</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shenvi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Quach</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sutjiadi</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Richardson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Developing a semantic model to describe physical activity data</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2016</year>
          <volume>225</volume>
          <fpage>447</fpage>
          <lpage>51</lpage>
          <pub-id pub-id-type="medline">27332240</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hollister</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Restrepo</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Farber-Eger</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Crawford</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Aldrich</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Non</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Development and performance of text-mining algorithms to extract socioeconomic status from de-identified electronic health records</article-title>
          <source>Pacific Symposium on Biocomputing</source>
          <year>2017</year>
          <volume>22</volume>
          <fpage>230</fpage>
          <lpage>241</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://psb.stanford.edu/psb-online/proceedings/psb17/abstracts/2017_p230.html"/>
          </comment>
          <pub-id pub-id-type="doi">10.1142/9789813207813_0023</pub-id>
          <pub-id pub-id-type="medline">27896978</pub-id>
          <pub-id pub-id-type="pii">9789813207813_0023</pub-id>
          <pub-id pub-id-type="pmcid">PMC5147499</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Winden</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Monsen</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Melton</surname>
              <given-names>GB</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of flowsheet documentation in the electronic health record for residence, living situation, and living conditions</article-title>
          <source>AMIA Jt Summits Transl Sci Proc</source>
          <year>2018</year>
          <volume>2017</volume>
          <fpage>236</fpage>
          <lpage>245</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29888079"/>
          </comment>
          <pub-id pub-id-type="medline">29888079</pub-id>
          <pub-id pub-id-type="pmcid">PMC5961798</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Feller</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zucker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Don't Walk</surname>
              <given-names>OB</given-names>
            </name>
            <name name-style="western">
              <surname>Srikishan</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Martinez</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Gordon</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Towards the inference of social and behavioral determinants of sexual health: development of a gold-standard corpus with semi-supervised learning</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2018</year>
          <volume>2018</volume>
          <fpage>422</fpage>
          <lpage>429</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30815082"/>
          </comment>
          <pub-id pub-id-type="medline">30815082</pub-id>
          <pub-id pub-id-type="pmcid">PMC6371339</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pennington</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Socher</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>GloVe: Global Vectors for Word Representation</article-title>
          <year>2014</year>
          <conf-name>The 2014 Conference on Empirical Methods in Natural Language Processing</conf-name>
          <conf-date>October 25-29, 2014</conf-date>
          <conf-loc>Doha, Qatar</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>1532</fpage>
          <lpage>1543</lpage>
          <pub-id pub-id-type="doi">10.3115/v1/D14-1162</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bojanowski</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Grave</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Joulin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Enriching word vectors with subword information</article-title>
          <source>Transactions of the Association for Computational Linguistics</source>
          <year>2017</year>
          <month>12</month>
          <volume>5</volume>
          <fpage>135</fpage>
          <lpage>146</lpage>
          <pub-id pub-id-type="doi">10.1162/tacl_a_00051</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>BioWordVec, improving biomedical word embeddings with subword information and MeSH</article-title>
          <source>Sci Data</source>
          <year>2019</year>
          <month>05</month>
          <day>10</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>52</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31076572"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41597-019-0055-0</pub-id>
          <pub-id pub-id-type="medline">31076572</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41597-019-0055-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6510737</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>BioSentVec: creating sentence embeddings for biomedical texts</article-title>
          <year>2019</year>
          <conf-name>2019 IEEE International Conference on Healthcare Informatics (ICHI)</conf-name>
          <conf-date>June 10-13, 2019</conf-date>
          <conf-loc>Xi'an, China</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>IEEE</publisher-name>
          <pub-id pub-id-type="doi">10.1109/ichi.2019.8904728</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reimers</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Gurevych</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Sentence-BERT: sentence embeddings using Siamese BERT-networks</article-title>
          <year>2019</year>
          <month>11</month>
          <conf-name>The 2019 Conference on Empirical Methods in Natural Language Processing</conf-name>
          <conf-date>November 3-7, 2019</conf-date>
          <conf-loc>Hong Kong, China</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <pub-id pub-id-type="doi">10.18653/v1/d19-1410</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Michalopoulos</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kaka</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>UmlsBERT: clinical domain knowledge augmentation of contextual embeddings using the Unified Medical Language System Metathesaurus</article-title>
          <year>2021</year>
          <month>06</month>
          <conf-name>The 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</conf-name>
          <conf-date>June 6-11, 2021</conf-date>
          <conf-loc>Online</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>1744</fpage>
          <lpage>1753</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2021.naacl-main.139</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tormey</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>McCreedy</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Browne</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Generating the MEDLINE N-gram set</article-title>
          <year>2015</year>
          <conf-name>AMIA Annual Symposium</conf-name>
          <conf-date>November 14-18, 2015</conf-date>
          <conf-loc>San Francisco, CA</conf-loc>
          <fpage>1569</fpage>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tormey</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>McCreedy</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Browne</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Generating a distilled N-gram set - effective lexical multiword building in the SPECIALIST lexicon</article-title>
          <year>2017</year>
          <month>02</month>
          <conf-name>The 10th International Joint Conference on Biomedical Engineering Systems and Technologies (BIOSTEC 2017)</conf-name>
          <conf-date>February 21-23, 2017</conf-date>
          <conf-loc>Porto, Portugal</conf-loc>
          <fpage>77</fpage>
          <lpage>87</lpage>
          <pub-id pub-id-type="doi">10.5220/0006142000770087</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="web">
          <source>GitHub</source>
          <access-date>2026-04-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/bwang482/SDoH_Extraction">https://github.com/bwang482/SDoH_Extraction</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Koo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Blum</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Black</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Fei</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Scalzo</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Kurtz</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Benchmarking open-source large language models, GPT-4 and Claude 2 on multiple-choice questions in nephrology</article-title>
          <source>NEJM AI</source>
          <year>2024</year>
          <month>01</month>
          <day>17</day>
          <volume>1</volume>
          <issue>2</issue>
          <fpage>AIdbp2300092</fpage>
          <pub-id pub-id-type="doi">10.1056/aidbp2300092</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Safari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Capabilities of GPT-5 on multimodal medical reasoning</article-title>
          <source>arXiv. Preprint posted online August 11, 2025</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2508.08224"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2508.08224</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Longpre</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zoph</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tay</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Fedus</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Dehghani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Brahma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Webson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Suzgun</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chowdhery</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Castro-Ros</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pellat</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Valter</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Narang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Petrov</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Scaling instruction-finetuned language models</article-title>
          <source>Journal of Machine Learning Research</source>
          <year>2024</year>
          <month>01</month>
          <day>01</day>
          <fpage>3381</fpage>
          <lpage>3433</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jmlr.org/papers/v25/23-0870.html"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ouyang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Almeida</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wainwright</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mishkin</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Slama</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ray</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schulman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hilton</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kelton</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Simens</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Askell</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Welinder</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Christiano</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Leike</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lowe</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Training language models to follow instructions with human feedback</article-title>
          <source>NIPS'22: Proceedings of the 36th International Conference on Neural Information Processing System</source>
          <year>2022</year>
          <conf-name>NIPS'22: 36th International Conference on Neural Information Processing Systems</conf-name>
          <conf-date>December 9, 2022</conf-date>
          <conf-loc>New Orleans, LA</conf-loc>
          <fpage>27730</fpage>
          <lpage>27744</lpage>
          <pub-id pub-id-type="doi">10.52202/068431-2011</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bosma</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Guu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lester</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Finetuned language models are zero-shot learners</article-title>
          <year>2022</year>
          <conf-name>International Conference on Learning Representations</conf-name>
          <conf-date>April 25, 2022</conf-date>
          <conf-loc>Online</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sanh</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Webson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Raffel</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bach</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sutawika</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Alyafeai</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Chaffin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stiegler</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Raja</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Thakker</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Szczechla</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chhablani</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Nayak</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Datta</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Manica</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yong</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Pandey</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Bawden</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Neeraj</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Rozen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Santilli</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Févry</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fries</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Teehan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Scao</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Biderman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wolf</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Rush</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Multitask prompted training enables zero-shot task generalization</article-title>
          <year>2022</year>
          <conf-name>International Conference on Learning Representations</conf-name>
          <conf-date>April 25, 2022</conf-date>
          <conf-loc>Online</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/2022.acl-demo.9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Keloth</surname>
              <given-names>VK</given-names>
            </name>
            <name name-style="western">
              <surname>Zuo</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Improving large language models for clinical named entity recognition via prompt engineering</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2024</year>
          <month>01</month>
          <day>27</day>
          <fpage>1812</fpage>
          <lpage>1820</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocad259</pub-id>
          <pub-id pub-id-type="medline">38281112</pub-id>
          <pub-id pub-id-type="pii">7590607</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>More agents is all you need</article-title>
          <source>Transactions on Machine Learning Research</source>
          <year>2024</year>
          <month>10</month>
          <fpage>1</fpage>
          <lpage>18</lpage>
          <comment>(forthcoming)<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://openreview.net/pdf?id=bgzUSZ8aeg"/></comment>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Merge, ensemble, and cooperate! A survey on collaborative strategies in the era of large language models</article-title>
          <source>arXiv. Preprint posted online July 8, 2024</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2407.06089"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2407.06089</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ban</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>PS</given-names>
            </name>
          </person-group>
          <article-title>Harnessing multiple large language models: a survey on LLM ensemble</article-title>
          <source>arXiv. Preprint posted online February 25, 2025</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2502.18036"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2502.18036</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Large language model synergy for ensemble learning in medical question answering: design and evaluation study</article-title>
          <source>J Med Internet Res</source>
          <year>2025</year>
          <month>07</month>
          <day>14</day>
          <volume>27</volume>
          <fpage>e70080</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2025//e70080/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/70080</pub-id>
          <pub-id pub-id-type="medline">40658884</pub-id>
          <pub-id pub-id-type="pii">v27i1e70080</pub-id>
          <pub-id pub-id-type="pmcid">PMC12337233</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ramachandran</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lybarger</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dobbins</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Uzuner</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Yetisgen</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Prompt-based extraction of social determinants of health using few-shot learning</article-title>
          <year>2023</year>
          <conf-name>The 5th Clinical Natural Language Processing Workshop</conf-name>
          <conf-date>July 14, 2023</conf-date>
          <conf-loc>Toronto, Canada</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <pub-id pub-id-type="doi">10.18653/v1/2023.clinicalnlp-1.41</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brignone</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>LeJeune</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mihalko</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Shannon</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Sinoway</surname>
              <given-names>LI</given-names>
            </name>
          </person-group>
          <article-title>Self-reported social determinants of health and area-level social vulnerability</article-title>
          <source>JAMA Netw Open</source>
          <year>2024</year>
          <month>05</month>
          <day>01</day>
          <volume>7</volume>
          <issue>5</issue>
          <fpage>e2412109</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38767915"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2024.12109</pub-id>
          <pub-id pub-id-type="medline">38767915</pub-id>
          <pub-id pub-id-type="pii">2818856</pub-id>
          <pub-id pub-id-type="pmcid">PMC11107301</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Padman</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Social determinants of health in electronic health records and their impact on analysis and risk prediction: a systematic review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2020</year>
          <month>11</month>
          <day>01</day>
          <volume>27</volume>
          <issue>11</issue>
          <fpage>1764</fpage>
          <lpage>1773</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33202021"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocaa143</pub-id>
          <pub-id pub-id-type="medline">33202021</pub-id>
          <pub-id pub-id-type="pii">5959858</pub-id>
          <pub-id pub-id-type="pmcid">PMC7671639</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mitra</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kessler</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Post-discharge suicide prediction among US veterans using natural language processing-enriched social and behavioral determinants of health</article-title>
          <source>Npj Ment Health Res</source>
          <year>2025</year>
          <month>02</month>
          <day>22</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>8</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s44184-025-00120-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s44184-025-00120-2</pub-id>
          <pub-id pub-id-type="medline">39987238</pub-id>
          <pub-id pub-id-type="pii">10.1038/s44184-025-00120-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC11846906</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kwak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the impact of social determinants on health prediction in the intensive care unit</article-title>
          <year>2023</year>
          <conf-name>The 2023 AAAI/ACM Conference on AI, Ethics, and Society</conf-name>
          <conf-date>August 8-10, 2023</conf-date>
          <conf-loc>Montréal, Canada</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>Association for Computing Machinery</publisher-name>
          <fpage>333</fpage>
          <lpage>350</lpage>
          <pub-id pub-id-type="doi">10.1145/3600211.3604719</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hartzler</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wedgeworth</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Spice</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lybarger</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wood</surname>
              <given-names>BR</given-names>
            </name>
            <name name-style="western">
              <surname>Duber</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Hsieh</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>AP</given-names>
            </name>
            <collab>SDoH Community Champion Advisory Board</collab>
          </person-group>
          <article-title>Integrating patient voices into the extraction of social determinants of health from clinical notes: ethical considerations and recommendations</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2023</year>
          <month>07</month>
          <day>19</day>
          <volume>30</volume>
          <issue>8</issue>
          <fpage>1456</fpage>
          <lpage>1462</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36944091"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocad043</pub-id>
          <pub-id pub-id-type="medline">36944091</pub-id>
          <pub-id pub-id-type="pii">7082925</pub-id>
          <pub-id pub-id-type="pmcid">PMC10354781</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Na</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kwak</surname>
              <given-names>HR</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jester</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bandara</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>JY</given-names>
            </name>
            <name name-style="western">
              <surname>Moutier</surname>
              <given-names>CY</given-names>
            </name>
            <name name-style="western">
              <surname>Pietrzak</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Oquendo</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Jeste</surname>
              <given-names>DV</given-names>
            </name>
          </person-group>
          <article-title>Social determinants of health and suicide-related outcomes: a review of meta-analyses</article-title>
          <source>JAMA Psychiatry</source>
          <year>2025</year>
          <month>01</month>
          <day>02</day>
          <volume>82</volume>
          <issue>4</issue>
          <fpage>337</fpage>
          <lpage>346</lpage>
          <pub-id pub-id-type="doi">10.1001/jamapsychiatry.2024.4241</pub-id>
          <pub-id pub-id-type="medline">39745761</pub-id>
          <pub-id pub-id-type="pii">2828935</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Papini</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hsin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kipnis</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>VX</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Girard</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sterling</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Iturralde</surname>
              <given-names>EM</given-names>
            </name>
          </person-group>
          <article-title>Validation of a multivariable model to predict suicide attempt in a mental health intake sample</article-title>
          <source>JAMA Psychiatry</source>
          <year>2024</year>
          <month>07</month>
          <day>01</day>
          <volume>81</volume>
          <issue>7</issue>
          <fpage>700</fpage>
          <lpage>707</lpage>
          <pub-id pub-id-type="doi">10.1001/jamapsychiatry.2024.0189</pub-id>
          <pub-id pub-id-type="medline">38536187</pub-id>
          <pub-id pub-id-type="pii">2816805</pub-id>
          <pub-id pub-id-type="pmcid">PMC10974695</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
