<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="review-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v12i1e60164</article-id>
      <article-id pub-id-type="pmid">39432345</article-id>
      <article-id pub-id-type="doi">10.2196/60164</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Review</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Review</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Health Care Language Models and Their Fine-Tuning for Information Extraction: Scoping Review</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Castonguay</surname>
            <given-names>Alexandre</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Kocian</surname>
            <given-names>Alexander</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Carvalho</surname>
            <given-names>Deborah Ribeiro</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Nunes</surname>
            <given-names>Miguel</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4909-6341</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Bone</surname>
            <given-names>Joao</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3359-9780</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Ferreira</surname>
            <given-names>Joao C</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6662-0806</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Elvas</surname>
            <given-names>Luis B</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <address>
            <institution>Department of Logistics, Molde, University College</institution>
            <addr-line>Britvegen 2, Noruega</addr-line>
            <addr-line>Molde, 6410</addr-line>
            <country>Norway</country>
            <phone>47 969152334</phone>
            <email>luis.m.elvas@himolde.no</email>
          </address>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7489-4380</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>ISTAR</institution>
        <institution>Instituto Universitário de Lisboa (ISCTE-IUL)</institution>
        <addr-line>Lisbon</addr-line>
        <country>Portugal</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Select Data</institution>
        <addr-line>Anaheim, CA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Logistics, Molde, University College</institution>
        <addr-line>Molde</addr-line>
        <country>Norway</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>INOV Inesc Inovação</institution>
        <institution>Instituto de Novas Tecnologias</institution>
        <addr-line>Lisbon</addr-line>
        <country>Portugal</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Luis B Elvas <email>luis.m.elvas@himolde.no</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>21</day>
        <month>10</month>
        <year>2024</year>
      </pub-date>
      <volume>12</volume>
      <elocation-id>e60164</elocation-id>
      <history>
        <date date-type="received">
          <day>3</day>
          <month>5</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>13</day>
          <month>6</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>14</day>
          <month>7</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>6</day>
          <month>8</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Miguel Nunes, Joao Bone, Joao C Ferreira, Luis B Elvas. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 21.10.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2024/1/e60164" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>In response to the intricate language, specialized terminology outside everyday life, and the frequent presence of abbreviations and acronyms inherent in health care text data, domain adaptation techniques have emerged as crucial to transformer-based models. This refinement in the knowledge of the language models (LMs) allows for a better understanding of the medical textual data, which results in an improvement in medical downstream tasks, such as information extraction (IE). We have identified a gap in the literature regarding health care LMs. Therefore, this study presents a scoping literature review investigating domain adaptation methods for transformers in health care, differentiating between English and non-English languages, focusing on Portuguese. Most specifically, we investigated the development of health care LMs, with the aim of comparing Portuguese with other more developed languages to guide the path of a non–English-language with fewer resources.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to research health care IE models, regardless of language, to understand the efficacy of transformers and what are the medical entities most commonly extracted.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>This scoping review was conducted using the PRISMA-ScR (Preferred Reporting Items for Systematic reviews and Meta-Analyses extension for Scoping Reviews) methodology on Scopus and Web of Science Core Collection databases. Only studies that mentioned the creation of health care LMs or health care IE models were included, while large language models (LLMs) were excluded. The latest were not included since we wanted to research LMs and not LLMs, which are architecturally different and have distinct purposes.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Our search query retrieved 137 studies, 60 of which met the inclusion criteria, and none of them were systematic literature reviews. English and Chinese are the languages with the most health care LMs developed. These languages already have disease-specific LMs, while others only have general–health care LMs. European Portuguese does not have any public health care LM and should take examples from other languages to develop, first, general-health care LMs and then, in an advanced phase, disease-specific LMs. Regarding IE models, transformers were the most commonly used method, and named entity recognition was the most popular topic, with only a few studies mentioning Assertion Status or addressing medical lexical problems. The most extracted entities were diagnosis, posology, and symptoms.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The findings indicate that domain adaptation is beneficial, achieving better results in downstream tasks. Our analysis allowed us to understand that the use of transformers is more developed for the English and Chinese languages. European Portuguese lacks relevant studies and should draw examples from other non-English languages to develop these models and drive progress in AI. Health care professionals could benefit from highlighting medically relevant information and optimizing the reading of the textual data, or this information could be used to create patient medical timelines, allowing for profiling.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>language model</kwd>
        <kwd>information extraction</kwd>
        <kwd>healthcare</kwd>
        <kwd>PRISMA-ScR</kwd>
        <kwd>scoping literature review</kwd>
        <kwd>transformers</kwd>
        <kwd>natural language processing</kwd>
        <kwd>European Portuguese</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The health care sector generates a vast amount of structured and unstructured data, including images from medical exams, text written in electronic medical records (EMRs) or Electronic Health Records (EHRs), and structured data from relational databases that store patient and admission information, as well as all the data collected during a patient’s hospitalization [<xref ref-type="bibr" rid="ref1">1</xref>]. Approximately 30% of the world’s data volume is generated by the health care sector, and projections indicate that by 2025, the compound annual growth rate of data for health care will reach 36% [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
      <p>Medical texts present several challenges due to the use of unfamiliar context-specific terminologies that differ from everyday language. In addition, physicians often use abbreviations and acronyms to save time and space. However, the same abbreviation can have different meanings, adding an additional layer of complexity when trying to understand the content of medical texts [<xref ref-type="bibr" rid="ref3">3</xref>]. All these characteristics pose challenges when attempting to apply artificial intelligence (AI) techniques to interpret the text.</p>
      <p>In the field of natural language processing (NLP), the introduction of transformers [<xref ref-type="bibr" rid="ref4">4</xref>] has revolutionized the field, achieving state-of-the-art performance for numerous NLP tasks [<xref ref-type="bibr" rid="ref5">5</xref>]. Their general architecture comprises an encoder, which receives the input and builds a representation of it, and a decoder that uses the encoder’s representation along with other inputs to generate a target sequence. The introduction of the self-attention mechanism further revolutionized NLP by allowing the model to weigh the importance of different words in a sentence regardless of their position. This enables better handling of long-range dependencies compared with traditional deep learning (DL) architectures like recurrent neural networks (RNNs) and long short-term memory Networks [<xref ref-type="bibr" rid="ref6">6</xref>]. In the context of medical text, transformers excel in interpreting and extracting medically relevant information by effectively handling context and meaning, even in complex and specialized language.</p>
      <p>Transformers can be trained as language models (LMs) on raw text in a self-supervised manner, enabling them to develop a statistical understanding of the text they were trained on [<xref ref-type="bibr" rid="ref7">7</xref>]. However, the benefits of this approach are only fully realized when fine-tuning a downstream task.</p>
      <p>Another important concept is called domain adaptation, which stands for the process of adapting or adjusting something to be suitable within a different domain or context. In the field of machine learning (ML), domain adaptation is used to align the disparity between domains so that the trained model can generalize into the domain of interest [<xref ref-type="bibr" rid="ref8">8</xref>]. For transformers, domain adaptation involves continuing the pretraining of an LM with text data from a different domain than the one it was originally trained on [<xref ref-type="bibr" rid="ref9">9</xref>]. This approach allows for leveraging the learning capabilities of general-scope LMs and refining them for specific contexts. For example, if we consider a general-scope LM, one that was trained using textual data from various domains, and continue its pretraining with health care–specific textual data, it will help the LM to refine its understanding of the health care data, leading to improvements when fine-tuning the LM for downstream tasks related to health care. To explore this further, we can take a health care LM who was trained using EMRs from a hospital and continue its pretraining using only text from patients with a specific disease. It will allow the LM to adjust its weights and become more precise when interpreting texts related to that particular disease.</p>
      <p>An example of domain adaptation is the BioBERT model [<xref ref-type="bibr" rid="ref10">10</xref>], which resulted from the continuation of the pretraining of the Bidirectional Encoder Representations from Transformers (BERT) [<xref ref-type="bibr" rid="ref10">10</xref>] model on biomedical text. The BioBERT model outperformed its predecessor in biomedical named entity recognition (NER), relation extraction, and question-answering tasks. Alzheimer’s Disease-BERT [<xref ref-type="bibr" rid="ref11">11</xref>] and CancerBERT [<xref ref-type="bibr" rid="ref12">12</xref>] are 2 examples of applying domain adaptation to a more restricted domain. Both models outperformed their respective baselines on downstream tasks related to their respective diseases. Summing up, performing domain adaptation for the health care sector appears inevitable to improve results, for example, for information extraction (IE) models, where a better understanding of medical terminologies and lexicon would make it easier to identify and extract information [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
      <p>The European Portuguese (PT-PT) language does not generate the same amount of data as the English language, resulting in limitations in the literature and the published models. A study published in 2023 by the Ernst &amp; Young Audit highlights the following areas where AI can play a relevant role in Portugal’s health care; disease diagnoses, precision medicine, remote monitoring and prevention, data management and hospital efficiency, and health policies [<xref ref-type="bibr" rid="ref14">14</xref>]. Recently, a project was launched in Portugal, funded by the European Union, with the aim of creating PT-PT NLP solutions for the health care sector. Under this scope, the objective is to create PT-PT medical LM and IE models to automatically identify medically relevant entities.</p>
      <p>Therefore, in this study, we aim to present a scoping literature review (SLR), in which we will begin by exploring the creation of health care LMs through domain adaptation and analyze their results. In addition, we aim to focus on the geographical domain to understand the current state-of-the-art for the Portuguese language and compare it to other, potentially more developed, languages to identify further steps. We also want to explore IE models in the health care sector, regardless of their data language, to understand the most commonly extracted medical entities and the methods used in doing so. Despite the literature being rich in studies focused on health care large language models (LLMs), there is a lack of studies that evaluate the current state-of-the-art of health care LMs not only in English but also in other less-resourced languages. This will enable us to grasp how the community is using the capabilities of transformers and whether the advantages of using them are indeed present in the health care domain. In addition, researchers will have 1 study about health care LMs that could guide their path and help them understand how the literature has developed in their respective languages. Finally, we will present the corresponding discussion and the conclusion drawn from the SLR.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>To complete our goal, we have conducted an SLR to gain a better understanding of the research conducted in the application of health care–domain LMs and the development of IE models within the health care domain. In the first stage, our study encompasses health care–domain LMs in various languages, with a focus on the Portuguese language. In the second stage, we searched for studies related to IE models to evaluate the methods most frequently used. In terms of methodology, we followed the PRISMA-ScR (Preferred Reporting Items for Systematic reviews and Meta-Analyses extension for Scoping Reviews) [<xref ref-type="bibr" rid="ref15">15</xref>] to ensure a systematic and transparent approach in conducting and reporting our scoping review.</p>
      </sec>
      <sec>
        <title>Search Strategy and Inclusion Criteria</title>
        <p>This SLR was conducted in November 2023 and focused exclusively on studies and reviews published in journals within the last 5 years (2019-2023) that were written in English or Portuguese. It was not an arbitrary data range since limiting the search to the last 5 years ensures that the review includes the most recent and relevant studies, reflecting the latest advancements, technologies, and methodologies in the field. Since BERT [<xref ref-type="bibr" rid="ref10">10</xref>], one of the most popular transformer architectures, and LM were launched at the end of 2018, we searched for studies from 2019 onward. The primary databases used for this review were Scopus [<xref ref-type="bibr" rid="ref16">16</xref>] and the Web of Science Core Collection (WOSCC) [<xref ref-type="bibr" rid="ref17">17</xref>] since both databases are renowned for indexing a wide array of peer-reviewed journals across multidisciplinary fields [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. While acknowledging that additional databases might offer further insights, the significant overlap with these resources ensures that relevant studies are unlikely to be missed.</p>
        <p>The criteria were defined to include studies focused on continuing the pretraining of LMs to achieve health care–domain LMs or studies focused on creating IE models within the health care field. Therefore, we formulated a query that includes the training or fine-tuning LMs or IE Models within the context of health care or similar, using EMRs or EHRs as data.</p>
        <p>Since there is a significant semantic similarity between LMs and LLMs, we decided to exclude the second from the search query because it has a different purpose from the aim of our study. LLMs are typically composed of more than 7B parameters and are suited for text generation. LMs are models that are not, by themselves, suited to perform any downstream NLP task, needing to be readjusted or fine-tuned with labeled data to be able to perform downstream tasks.</p>
        <p>Our final query is as follows: “(“Language Model” OR “Masked Language Model” OR “Information Extraction” OR “Content Extraction”) AND (“EHR” OR “EMR” OR “Electronic Health Record” OR “Electronic Medical Record”) AND (“Fine-Tuned” OR “Fine-tuning” OR “Training” OR “Trained”) AND (“Healthcare” OR “Health Care” OR “Clinical” OR “Medical”) AND NOT (“Large Language Model” OR “LLM”).”</p>
        <p>According to our objectives, a study was considered valid if it documented a continuation of the pretraining of an LM to create a health care LM or if it focused on the creation of health care IE models.</p>
      </sec>
      <sec>
        <title>Study Selection</title>
        <p>To minimize the risk of bias in the study selection, the process was conducted independently by 3 researchers. A total of 2 researchers were responsible for reading and judging the studies according to the inclusion criteria, while the third researcher was involved in cases of disagreement.</p>
      </sec>
      <sec>
        <title>Data Charting and Synthesis</title>
        <p>A data-charting form was jointly developed by two reviewers to extract relevant information from the selected studies systematically. The form included variables such as study title, year of publication, language focus (English or non-English), domain adaptation techniques for Transformer-based models, healthcare-specific information extraction tasks, evaluation metrics used, and the specific health-related entities being extracted. Both reviewers independently charted the data to ensure comprehensive coverage of healthcare language models in English and non-English languages, with particular attention to languages other than English (referred to as non-English). Discrepancies in the extracted data were discussed and resolved through consensus. As the review progressed, the data-charting form was iteratively updated to capture emerging themes, especially regarding the disparity between language resources and technological development for healthcare information extraction across different languages.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>The query retrieved 137 papers, with the vast majority of these studies being retrieved from Scopus, adding up to 90 when compared with the 47 studies WOSCC has yielded. The PRISMA-ScR methodology was then followed, as seen in <xref rid="figure1" ref-type="fig">Figure 1</xref>. Since we included studies from sources beyond the 2 selected databases, we adhered to the updated PRISMA-ScR guideline [<xref ref-type="bibr" rid="ref20">20</xref>]. In the following subsections, we explained the decision to include studies by other methods.</p>
      <p>The first step was to identify and remove duplicated papers, resulting in 101 studies. Following a screening of titles and abstracts, 10 records were deemed out of scope, and 1 could not be retrieved, leaving us with 90 fully reviewed studies.</p>
      <p>After screening all the papers that matched our criteria, we realized that 30 of them did not meet our inclusion criteria. Some studies referred to the fine-tuning of pretrained LMs for tasks unrelated to IE, or they lacked relevant information to contribute to this study, or even though we excluded them from our search query, they mentioned the use of LLMs.</p>
      <p>As we were focused on the Portuguese language, our study also emphasized the geographical domain, with an aim to comprehend the medical data language used in health care LMs. <xref ref-type="table" rid="table1">Table 1</xref> resumes the studies focused on the pretraining of LMs separated by the language of their data.</p>
      <p>From the reading of <xref ref-type="table" rid="table1">Table 1</xref>, we can understand that English is the main language, which can be explained by the much higher availability of English data and the overwhelming presence and applicability of this language throughout the world. However, we notice that in the Chinese language, there are studies attempting to fill the gap of being non-English, creating in-domain LMs aware of their benefits. We also found studies in Brazilian Portuguese (PT-BR), Spanish, and PT-PT, and we acknowledge that there might be other studies in different languages, even though they did not match our search query criteria.</p>
      <p>Changing the view for the health care IE studies, <xref rid="figure2" ref-type="fig">Figure 2</xref> resumes the distribution of studies by topic.</p>
      <p>From the reading of <xref rid="figure2" ref-type="fig">Figure 2</xref>, NER appears as the main topic on the IE, with only 2 studies performing Assertion Status and 3 studies focused on solving medical lexical problems.</p>
      <p>To provide a more in-depth review of each study, we present the subsequent 3 subsections where we differentiate between non-Portuguese health care LMs, Portuguese health care LMs, and health care IE models.</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>PRISMA-ScR (Preferred Reporting Items for Systematic reviews and Meta-Analyses extension for Scoping Reviews) workflow diagram. WOSCC: Web of Science Core Collection.</p>
        </caption>
        <graphic xlink:href="medinform_v12i1e60164_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Studies for pretraining language models (LMs) were reviewed by their data language.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="390"/>
          <col width="330"/>
          <col width="280"/>
          <thead>
            <tr valign="top">
              <td>Medical data language</td>
              <td>Reference</td>
              <td>Studies, n</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>English</td>
              <td>[<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref25">25</xref>]</td>
              <td>7</td>
            </tr>
            <tr valign="top">
              <td>Chinese</td>
              <td>[<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref29">29</xref>]</td>
              <td>4</td>
            </tr>
            <tr valign="top">
              <td>Brazilian Portuguese</td>
              <td>[<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]</td>
              <td>2</td>
            </tr>
            <tr valign="top">
              <td>Spanish</td>
              <td>[<xref ref-type="bibr" rid="ref32">32</xref>]</td>
              <td>1</td>
            </tr>
            <tr valign="top">
              <td>European Portuguese</td>
              <td>[<xref ref-type="bibr" rid="ref33">33</xref>]</td>
              <td>1</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <fig id="figure2" position="float">
        <label>Figure 2</label>
        <caption>
          <p>Distribution of health care information extraction (IE) studies by topic. NER: named entity recognition.</p>
        </caption>
        <graphic xlink:href="medinform_v12i1e60164_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <sec>
        <title>Non-Portuguese Health Care Language Models</title>
        <p>A study by Zhou et al [<xref ref-type="bibr" rid="ref12">12</xref>] introduces CancerBERT, a domain-specific LM, that resulted from continuing the pretraining of the BlueBERT model [<xref ref-type="bibr" rid="ref34">34</xref>] with a cancer corpus, resulting in various checkpoints of CancerBERT. The evaluation was performed for the cancer phenotyping NER task, with the results showing that the CancerBERT model pretrained with the cancer corpus outperformed the checkpoint using the original BERT [<xref ref-type="bibr" rid="ref10">10</xref>] vocabulary.</p>
        <p>A similar approach was conducted in a study by Mao et al [<xref ref-type="bibr" rid="ref11">11</xref>], where the objective was to predict the risk of disease progression from Mild Cognitive Impairment to Alzheimer disease. A BERT model specifically tailored for Alzheimer disease (ie, AD-BERT) was pretrained with clinical notes, and its comparison with other models in experiments showed the benefits of domain adaptation.</p>
        <p>Within the same scope, the identification of fall incidents from EHRs is discussed in the study by Fu et al [<xref ref-type="bibr" rid="ref21">21</xref>]. A context-aware LM, BERT-based, was trained and integrated into a hybrid architecture along with post hoc heuristic rules. The performance of the BERT-based model was compared with DL methods, and the conclusions highlighted that the BERT model achieved superior results in identifying fall events.</p>
        <p>In a study by Wang et al [<xref ref-type="bibr" rid="ref26">26</xref>], a Chinese medical text corpus was used to pretrain BERT and obtain the Chinese BERT model. The results were aligned with previous studies, and domain adaptation demonstrated better results than traditional DL models and other pretrained LMs.</p>
        <p>Studies by Roitero et al [<xref ref-type="bibr" rid="ref22">22</xref>] and Agnikula Kshatriya et al [<xref ref-type="bibr" rid="ref23">23</xref>] once again mention the pretraining of BERT models on a medical corpus, achieving comparable or better performance than state-of-the-art models. In a study by Zhang et al [<xref ref-type="bibr" rid="ref24">24</xref>], an unsupervised adversarial domain adaptation framework with a pretrained LM for clinical event sequences is presented. Another example can be found in a study by Chen et al [<xref ref-type="bibr" rid="ref25">25</xref>], where a contextual LM is used in combination with rule-based preprocessing methods to develop a model for <italic>ICD-10</italic> (<italic>International Statistical Classification of Diseases, Tenth Revision</italic>) multilabel classification. The results demonstrate superiority over state-of-the-art models. Studies by Wen G et al and Wen C et al [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>] refer to the training of a domain-specific pretrained LM on unlabeled medical data, with the evaluation being made through NER.</p>
        <p>In the process of reviewing all the papers, we observed references to papers that aligned with our requirements despite not being explicitly included within our search query criteria. It is the case of studies by Zhang et al [<xref ref-type="bibr" rid="ref29">29</xref>] and Carrino et al [<xref ref-type="bibr" rid="ref32">32</xref>]. Carrino et al [<xref ref-type="bibr" rid="ref32">32</xref>] present a large-scale biomedical Spanish LM, where the models were pretrained from scratch, using a RoBERTa [<xref ref-type="bibr" rid="ref35">35</xref>] base model, and then fine-tuned on 3 clinical NER tasks. The comparison between general-domain and other available Spanish clinical models revealed the superiority of the models presented in the paper. Zhang et al [<xref ref-type="bibr" rid="ref29">29</xref>] share a similar scenario with BERT being pretrained on Chinese biomedical corpora, and MC-BERT, an in-domain LM, was developed. The results are consistent with previous studies, with MC-BERT outperforming BERT-based models in all evaluated tasks.</p>
      </sec>
      <sec>
        <title>Portuguese Health Care Language Models</title>
        <p>Our search query did not retrieve any studies for the Portuguese language. To address this scarcity of studies and since it is one of the objectives of this research, we carried out a broader search on Google Scholar [<xref ref-type="bibr" rid="ref36">36</xref>] to include studies that mentioned the creation of Portuguese health care LMs.</p>
        <p>The PT-BR language has already presented several studies, with BioBERTpt [<xref ref-type="bibr" rid="ref30">30</xref>] being one example. The authors used clinical notes and biomedical abstracts to pretrain 3 BERT-based checkpoints that were fine-tuned for the NER task to assess their performance. The results align with others, showing that the in-domain models achieved better performance. Another example is the study by Schneider et al [<xref ref-type="bibr" rid="ref31">31</xref>], where several clinical BERT-based checkpoints were developed resulting from the continuation of the pretraining of BERTimbau [<xref ref-type="bibr" rid="ref35">35</xref>], mBERT [<xref ref-type="bibr" rid="ref11">11</xref>], and all 3 BioBERTpt checkpoints on 150,000 clinical narratives from cardiology ambulatory. The results of fine-tuning for NER align with previous studies, demonstrating that the in-domain models outperformed general LMs.</p>
        <p>For the PT-PT language, we found the literature to be scarcer, with only 1 study being found that mentioned the continuation of the pretraining of an LM to achieve health care–domain LM. Coutinho and Martins [<xref ref-type="bibr" rid="ref33">33</xref>] propose a BERT-based model for assigning <italic>ICD-10</italic> codes to causes of death by using BERTimbau and continuing its pretraining with death certificates. The evaluation was made through NER, with all the checkpoints involved being fine-tuned for the classification task, and the findings indicated that transformer models could produce promising outcomes for health care tasks involving the analysis of relatively short documents.</p>
      </sec>
      <sec>
        <title>Health Care IE Models</title>
        <p>To better organize this section, we decided to categorize the studies by topic. Therefore, the first subsection presents NER studies where the authors attempted to automatically identify and extract medical information. The second subsection contains Assertion Status models, where entities are classified according to their status (present or absent), and finally, the third subsection presents studies that attempt to solve medical lexical problems.</p>
      </sec>
      <sec>
        <title>NER</title>
        <p>Zhou et al [<xref ref-type="bibr" rid="ref37">37</xref>] evaluated the performance of CancerBERT along with ML models for the breast cancer phenotype extraction task, with the results proving that CancerBERT has superior learning ability and generalizability for this task. Rahman et al [<xref ref-type="bibr" rid="ref38">38</xref>] refer to the use of BERT to identify the presence of a diagnosis in EHRs. With BERT’s ability to understand the context of text and based on conditions presented in EHRs, a pipeline was successfully designed to identify EHRs with the presence of a diagnosis, reducing the manual note review load. Crema et al [<xref ref-type="bibr" rid="ref39">39</xref>], use an Italian biomedical BERT model, fine-tuning it for the NER task with the entities of interest, including diagnoses, symptoms, drugs, and medical assessments, achieving an <italic>F</italic><sub>1</sub>-score of nearly 0.85 values. Entity-BERT was introduced in the study by Lu et al [<xref ref-type="bibr" rid="ref40">40</xref>], a DL-based model for entity IE that is capable of recognizing entities such as medical terminologies, disease names, or drug information. Zhang et al [<xref ref-type="bibr" rid="ref41">41</xref>] propose the combination of data augmentation and domain information using the Adapter Transformer Encoder Model for Clinical Event Detection. It uses the BioBERT model to generate word-level features, addressing the issue of many obscure professional terms in EMRs leading to poor recognition performance of the model. The results were reported to be superior to those of other existing models. A multilingual transformer was fine-tuned in a study by Kim et al [<xref ref-type="bibr" rid="ref42">42</xref>], where researchers successfully extracted alcohol-related information from unstructured clinical notes with an extraction accuracy of 0.84 as measured by the macro <italic>F</italic><sub>1</sub>-score. Kormilitzin et al [<xref ref-type="bibr" rid="ref43">43</xref>], initially pretrained a model on the task of predicting the next word and subsequently fine-tuned it for the NER task, extracting various categories of drugs and achieving performance with an <italic>F</italic><sub>1</sub>-score above 0.95 values. Solarte-Pabón et al [<xref ref-type="bibr" rid="ref44">44</xref>] evaluate the fine-tuning of several pretrained LMs for the NER task, aiming to identify breast cancer concepts in the Spanish language. The results show that BERT-based and RoBERTa-based LMs exhibit competitive performance on this task. Liu et al [<xref ref-type="bibr" rid="ref45">45</xref>] propose the use of BERT-BiLSTM-CRF for the NER task of rheumatoid arthritis vocabulary and then MC-BERT for the entity extraction task, with results showing <italic>F</italic><sub>1</sub>-scores above 90%. Wang et al [<xref ref-type="bibr" rid="ref46">46</xref>] compare the use of 4 pretrained transformer-based LMs fine-tuned for the NER task with a baseline regular expression model in order to extract ophthalmic examination components, demonstrating that transformers achieve superior results. In the study by Singh et al [<xref ref-type="bibr" rid="ref47">47</xref>], a pretrained transformer-based LM was fine-tuned with cardiac magnetic resonance imaging annotations to effectively extract measurements from clinical reports, and it achieved high extraction performance without requiring heuristics or expert annotations.</p>
        <p>Several studies focus on extracting information about family history, such as studies by Kim et al [<xref ref-type="bibr" rid="ref48">48</xref>], He et al [<xref ref-type="bibr" rid="ref49">49</xref>], Silva et al [<xref ref-type="bibr" rid="ref50">50</xref>], Dai et al [<xref ref-type="bibr" rid="ref51">51</xref>], and Zhan et al [<xref ref-type="bibr" rid="ref52">52</xref>]. They use ML methods, incorporating rule-based approaches, multitask-based artificial neural networks (ANN), attention-based neural networks, and even combinations such as convolutional neural networks (CNNs) BiLSTM and BERT. The goal was to automatically extract entities such as people’s names, residence, birth date, or death date, and in some cases, there is an additional subtask related to relation extraction, which involves identifying relationships between family members. Overall, the results have proven to be satisfactory, particularly in the NER task.</p>
        <p>CNNs are highly popular methods in the scientific community for extracting clinical information and studies by Yang et al [<xref ref-type="bibr" rid="ref53">53</xref>], Santus et al [<xref ref-type="bibr" rid="ref54">54</xref>], Mahajan and Rana [<xref ref-type="bibr" rid="ref55">55</xref>], and Landlosi et al [<xref ref-type="bibr" rid="ref56">56</xref>] primarily used them, often supplemented with rule-based approaches or feature optimization in some cases. The use of these methods lies in extracting clinical information from EHRs, tasks that could be time-consuming if done manually. Within the broader category of neural networks, RNNs are also a method used for IE in which the authors of studies [<xref ref-type="bibr" rid="ref57">57</xref>-<xref ref-type="bibr" rid="ref66">66</xref>] all use RNNs, with BiLSTM-CRF (Bidirectional Long Short-Term Memory - Conditional Random Field) being a very popular network among these studies. The main topics extracted include terms related to specific diseases, drug names with associated attributes (dosage, frequency, duration, route, and condition), adverse drug events, the presence of a diagnosis, or even important information in medical image reports, with the results globally proven to be promising.</p>
        <p>Studies [<xref ref-type="bibr" rid="ref67">67</xref>-<xref ref-type="bibr" rid="ref69">69</xref>] use ML methods, with the first focusing on automatically classifying the outcomes of specific tasks related to the clinical conditions of stroke survivors, the second aiming to extract useful information in abdominopelvic radiology reports, and the third one focused on extracting travel history mentions from clinical documents. In Malmasi et al [<xref ref-type="bibr" rid="ref70">70</xref>], the use of different methods to extract low-prevalence concepts is discussed, specifically in the case of insulin rejection by patients with attempts at both sentence-level and token-level approaches using ML and DL methods, but the results showed that it is challenging to automatically identify low-prevalence concepts. Similar proposals have been presented in studies [<xref ref-type="bibr" rid="ref71">71</xref>-<xref ref-type="bibr" rid="ref79">79</xref>] using spaCy’s [<xref ref-type="bibr" rid="ref80">80</xref>] pipeline for IE, contextual embeddings such as embeddings from language models (ELMo) [<xref ref-type="bibr" rid="ref81">81</xref>] and BERT, position-attention mechanisms, knowledge graph embeddings, word segmentation models, or even NLP models developed using Java for extracting medical information, for example, extracting details related to drugs, drug attributes, or diagnoses.</p>
        <p>In Lee and Uppal [<xref ref-type="bibr" rid="ref82">82</xref>], a web-based summarization and visualization tool is introduced for extracting salient information from clinical and biomedical text, featuring sentence ranking by relevance and facilitating early medical risk detection in clinical settings. Chen et al [<xref ref-type="bibr" rid="ref83">83</xref>] aimed to create a model to extract concept embeddings from EHRs for disease pattern retrieval and subsequent classification tasks.</p>
      </sec>
      <sec>
        <title>Assertion Status</title>
        <p>Sykes et al [<xref ref-type="bibr" rid="ref84">84</xref>] address the issue of negation and non-negation of clinical terms in EHRs. It is an Assertion Status case, in which the text can be characterized by cases where diseases are stated to be absent or only hypothesized. In this study, they propose various methods to address this issue, including rule-based, ML, or DL approaches, and all proposals yielded good results in a test set, achieving an <italic>F</italic><sub>1</sub>-score of more than 0.95. In Chaturvedi et al [<xref ref-type="bibr" rid="ref85">85</xref>], a corpus annotated with mentions of pain was developed, considering the presence or absence of pain. It is another example of an Assertion Status problem aimed at facilitating further studies using the corpus to better understand how pain is mentioned in clinical notes.</p>
      </sec>
      <sec>
        <title>Medical Lexical Problems</title>
        <p>From a different perspective, there have been studies focusing on medical lexical problems. Newman-Griffis et al [<xref ref-type="bibr" rid="ref86">86</xref>] discuss the presence of ambiguous words and attempts to normalize medical concepts to standardize vocabularies, while the study by Jaber et al [<xref ref-type="bibr" rid="ref87">87</xref>] addresses the problem of the frequent use of abbreviations by proposing a method, by fine-tuning a pretrained LM, to successfully disambiguate clinical abbreviations. Lee et al [<xref ref-type="bibr" rid="ref88">88</xref>] propose a typographical error correction model that considers context, based on a masked LM, to address the issue of typographical errors in real-world medical data. They conclude that typographical errors in unstructured text negatively impact the performance of NLP tasks, and their method is robust and applicable in real-world environments.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Continuing the pretraining of LMs to develop health care LMs has proven beneficial. The most common method to evaluate this approach is by fine-tuning both the baseline and the in-domain LM on downstream NLP tasks and comparing the results.</p>
        <p>In IE models, NER is the most popular topic aimed at automatically identifying and extracting medically relevant information. Transformers are the preferred technology for this purpose, with fine-tuning of medical LMs consistently achieving superior results.</p>
        <p>To conclude our SLR, we engaged in a deeper discussion divided into health care LMs and health care IE models.</p>
      </sec>
      <sec>
        <title>Health Care Language Models</title>
        <p>On a global scale, we have identified numerous studies that continued the pretraining of LMs to develop domain-specific LM, specifically medical LMs. In general, the findings across almost all of these studies substantiate the advantages of in-domain training before undertaking any other downstream tasks. The favorite evaluation task is NER, with almost every study mentioning the fine-tuning of LMs for the NER task.</p>
        <p>As shown in <xref ref-type="table" rid="table1">Table 1</xref>, English and Chinese are the languages with the most studies and published models due to the available resources in terms of data and hardware power. The level of domain adaptation for these languages is more advanced, with dedicated health care LMs developed for specific diseases such as Alzheimer Disease-BERT [<xref ref-type="bibr" rid="ref11">11</xref>] and CancerBERT [<xref ref-type="bibr" rid="ref12">12</xref>], which represent very focused domains. These studies offer advantages by achieving better performance in extracting specific concepts from textual data related to these diseases compared with general health care LMs.</p>
        <p>For non-English languages, the process is not so developed, which can be considered as expected since they have their known limitations, such as the scarcity of data and resources available. Nevertheless, there have been concerted efforts to create general health care LMs, underscoring the community’s recognition of the use of these models. The Portuguese language fits this context, and despite initial strides that have already been taken, there exists ample room for improvement, particularly in the context of PT-PT where the only published study is [<xref ref-type="bibr" rid="ref33">33</xref>], yet, to the best of our knowledge, the model is not publicly available.</p>
        <p>Non-English languages, particularly Portuguese, should draw inspiration from advancements and results in medical domain adaptation studies. Despite limited resources and available data, efforts should first focus on creating general medical LMs. In a subsequent phase, efforts should be directed toward narrowing down to specific diseases while performing domain adaptation. This approach ensures that knowledge previously acquired by the LMs is refined within the medical domain and then adapted to smaller medical domains without losing the previously acquired knowledge completely. This initiative aims to foster the development of AI technologies in Portuguese, thereby promoting health care equality and access in languages with fewer resources. These models can be further fine-tuned for medical NLP tasks, such as IE, aimed at automatically identifying or highlighting specific information or structuring medical information extracted from textual data for ML analysis to aid health care professionals.</p>
      </sec>
      <sec>
        <title>Health Care IE Models</title>
        <p>Several methods have been used to create health care IE models. The most common method is the use of transformers, followed by the application of other DL and ML methods (<xref ref-type="table" rid="table2">Table 2</xref>). As previously discussed, the most popular topic was NER, where authors attempted to identify and extract medically relevant information.</p>
        <p>The results indicate that the most successful approach involves using pretrained LMs fine-tuned for IE tasks, benefiting from the contextual understanding of the text to achieve better results. The most commonly identified entities were diagnoses or diseases and drugs, along with specific phenotypes related to certain diseases.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Number of studies used per method.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>Methods</td>
                <td>Articles</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Transformers</td>
                <td>16</td>
              </tr>
              <tr valign="top">
                <td>Other DL<sup>a</sup></td>
                <td>15</td>
              </tr>
              <tr valign="top">
                <td>RNN<sup>b</sup></td>
                <td>10</td>
              </tr>
              <tr valign="top">
                <td>Other ML<sup>c</sup></td>
                <td>9</td>
              </tr>
              <tr valign="top">
                <td>CNN<sup>d</sup></td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>Rule-based</td>
                <td>4</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>DL: deep learning.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>RNN: recurrent neural network.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>ML: machine learning.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>CNN: convolutional neural network.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>It is also relevant to mention that in our query, 2 studies were focused on Assertion Status. This task involves classification at the sentence level aimed at assessing an entity based on its presence or absence in the text. Examples of absence include negation or hypothesizing medical information. From another perspective, to address the problems presented by medical text, we also found 2 studies that propose solutions to disambiguate the multitude of abbreviations present in medical text and 1 study that presents a typo correction model. Both solutions aimed to improve text quality and seek to correct issues in the text that are considered inevitable by health care professionals. These 5 studies could also be seen as an improvement to NER results. The ones focused on correcting the text could be viewed as a preprocessing step that would enhance the understanding of the medical text, while the Assertion Status studies could help ascertain whether an identified entity is present or absent in a patient’s condition. When compared with the distribution of NER, these 2 topics lack development, as together, they account for only 10% of the health care IE studies found. The community would benefit from more studies using different technologies and identifying new challenges to be solved.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Our SLR highlights the benefits of in-domain training for health care LMs and the effectiveness of transformers in IE tasks, addressing a research gap regarding the lack of studies on health care LMs. Transformers excel in NER, identifying diagnoses, diseases, drugs, and phenotypes. English and Chinese lead in research and LM development, while non-English languages such as Portuguese show promise but need exploration. Challenges include Assertion Status and text disambiguation, necessitating diverse methodologies and research in health care IE.</p>
        <p>We have identified several health care–domain LMs, but there is a clear gap for non-English languages where the data and resources available are low. There is much to improve in those languages, with Portuguese being an example. The benefits of creating a medical-domain LM are already proven, and the health care sector could benefit greatly from a symbiosis with AI. Therefore, non-English languages should be motivated by the scarce studies already published and try to replicate them for their own language in order to fill this existing gap.</p>
        <p>From another point of view, the use of transformers appears to be the better technique to automatically identify medical information. Despite the annotation process for any supervised learning task being very time-consuming, transformers achieve better results on fewer annotations, making their usage on new tasks relatively easier. This task also benefits from an in-domain medical LM. The entities most commonly extracted are diagnosis or disease, posology-related entities, symptoms, and phenotypes related to specific diseases.</p>
        <p>Despite our belief that this was the right choice, we highlight the 2 databases that we searched, and we acknowledge that, despite our best efforts, there is always a possibility that not all relevant papers will be found when formulating a query. These are the limitations of our study. The chosen timeframe may also limit the availability of relevant studies, even though we believe it is the right timeframe to include studies that establish the current state-of-the-art with new technologies. While we focused on the Portuguese language, we acknowledge that our conclusions cannot be generalized to all non-English languages. However, other languages with similar characteristics in terms of available data and resources can certainly gain insights from this SLR.</p>
        <p>Globally, the development and research in these topics for the English language are very advanced compared with non-English languages. In English, several studies have been presented that perform domain adaptation for smaller domains, such as specific-disease LMs, which have improved results in extracting medical information related to these diseases. The next steps should involve continuing the pretraining for different medical areas or diseases to ensure the most comprehensive coverage with LMs. In addition, fine-tuning the already available models to meet the specific requirements of health care professionals is essential.</p>
        <p>Non-English languages are still performing domain adaptation for general domains, such as medical or biomedical fields, and should be motivated by these studies to overcome the barriers inherent in their respective language. In the next step, they should focus on performing domain adaptation, aiming to narrow down to specific medical areas or diseases. They should strive to replicate studies on Assertion Status or even those focused on resolving the frequent presence of abbreviations and typos in the text. In non-English languages where there is a scarcity of available data, it would be beneficial to have open corpora, even if distributed under licenses that protect data privacy, to enable more researchers to develop models.</p>
        <p>These types of studies are important to assess and guide the development of non-English languages trying to bridge the gaps and capitalize on the opportunities provided by these technologies to promote equity and improve access to health care all over the world. The differences in the available data and resources are almost impossible to correct but at least should be minimized.</p>
        <p>This effort aims to harness AI to enhance health care by developing advanced LMs tailored for non-English languages, thereby supporting health care professionals with decision-making tools that alleviate their workload and improve patient care indirectly.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>PRISMA-ScR checklist.</p>
        <media xlink:href="medinform_v12i1e60164_app1.pdf" xlink:title="PDF File  (Adobe PDF File), 509 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ANN</term>
          <def>
            <p>artificial neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">BERT</term>
          <def>
            <p>Bidirectional Encoder Representations from Transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">BiLSTM-CRF</term>
          <def>
            <p>Bidirectional Long Short-Term Memory - Conditional Random Field</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">CNN</term>
          <def>
            <p>convolutional neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">DL</term>
          <def>
            <p>deep learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">EMR</term>
          <def>
            <p>electronic medical record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">ELMo</term>
          <def>
            <p>embeddings from language models</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">ICD-10</term>
          <def>
            <p>International Statistical Classification of Diseases, Tenth Revision</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">IE</term>
          <def>
            <p>information extraction</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">LM</term>
          <def>
            <p>language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">NER</term>
          <def>
            <p>named entity recognition</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">PRISMA-ScR</term>
          <def>
            <p>Preferred Reporting Items for Systematic reviews and Meta-Analyses extension for Scoping Reviews</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb18">PT-BR</term>
          <def>
            <p>Brazilian Portuguese</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb19">PT-PT</term>
          <def>
            <p>European Portuguese</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb20">RNN</term>
          <def>
            <p>recurrent neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb21">SLR</term>
          <def>
            <p>systematic literature review</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb22">WOSCC</term>
          <def>
            <p>Web of Science Core Collection</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>MN’s work was supported by the project Blockchain.PT, (PRR RE-C05-i01.02: AGENDAS/ALIANÇAS VERDES PARA A INOVAÇÃO EMPRESARIAL).</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>MN, JB, and LBE performed conceptualization. MN and LBE conducted the investigation. JB, JCF, and LBE performed supervision. JB, LBE, and JCF conducted validation. MN wrote the original draft. JB, JCF, and LBE performed review and editing.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>HealthTech</collab>
          </person-group>
          <source>How to navigate structured and unstructured data as a healthcare organization</source>
          <access-date>2024-06-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://healthtechmagazine.net/article/2023/05/structured-vs-unstructured-data-in-healthcare-perfcon">https://healthtechmagazine.net/article/2023/05/structured-vs-unstructured-data-in-healthcare-perfcon</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>RBC Capital Markets</collab>
          </person-group>
          <source>Navigating the changing face of healthcare episode</source>
          <access-date>2023-10-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.rbccm.com/en/gib/healthcare/story.page">https://www.rbccm.com/en/gib/healthcare/story.page</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tayefi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ngo</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chomutare</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dalianis</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Salvi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Budrionis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Godtliebsen</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Challenges and opportunities beyond structured data in analysis of electronic health records</article-title>
          <source>WIREs Computational Stats</source>
          <year>2021</year>
          <volume>13</volume>
          <issue>6</issue>
          <fpage>e1549</fpage>
          <pub-id pub-id-type="doi">10.1002/wics.1549</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vaswani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shazeer</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Parmar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Uszkoreit</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gomez</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Kaiser</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Polosukhin</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Attention is all you need</article-title>
          <source>Computer Science Computation and Language</source>
          <year>2023</year>
          <pub-id pub-id-type="doi">10.5860/choice.189890</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chernyavskiy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ilvovsky</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nakov</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Transformers: "The End of History" for NLP?</article-title>
          <source>Computer Science Computation and Language</source>
          <year>2021</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/2105.00813"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rokon</surname>
              <given-names>OF</given-names>
            </name>
          </person-group>
          <article-title>RNN vs. LSTM vs. Transformers: unraveling the secrets of sequential data processing</article-title>
          <source>Medium</source>
          <year>2023</year>
          <access-date>2024-05-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medium.com/@mroko001/rnn-vs-lstm-vs-transformers-unraveling-the-secrets-of-sequential-data-processing-c4541c4b09f">https://tinyurl.com/432k5mn5</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <source>How do Transformers work? - Hugging Face NLP Course</source>
          <access-date>2023-12-06</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://huggingface.co/learn/nlp-course/chapter1/4">https://huggingface.co/learn/nlp-course/chapter1/4</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Farahani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Voghoei</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rasheed</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Arabnia</surname>
              <given-names>HR</given-names>
            </name>
          </person-group>
          <source>A brief review of domain adaptation</source>
          <year>2020</year>
          <access-date>2024-04-21</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/2010.03978">http://arxiv.org/abs/2010.03978</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <source>On the domain adaptation and generalization of pretrained language models: a survey</source>
          <year>2022</year>
          <access-date>2024-04-21</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/2211.03154">http://arxiv.org/abs/2211.03154</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>M-W</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>BERT: pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>ACL Anthology</source>
          <year>2019</year>
          <pub-id pub-id-type="doi">10.5260/chara.21.2.8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rasmussen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Adekkanattu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Pacheco</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bonakdarpour</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Vassar</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Pathak</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>AD-BERT: using pre-trained language model to predict the progression from mild cognitive impairment to alzheimer's disease</article-title>
          <source>J Biomed Inform</source>
          <year>2023</year>
          <volume>144</volume>
          <fpage>104442</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(23)00163-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2023.104442</pub-id>
          <pub-id pub-id-type="medline">37429512</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(23)00163-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC11131134</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>CancerBERT: a cancer domain-specific language model for extracting breast cancer phenotypes from electronic health records</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2022</year>
          <volume>29</volume>
          <issue>7</issue>
          <fpage>1208</fpage>
          <lpage>1216</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35333345"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocac040</pub-id>
          <pub-id pub-id-type="medline">35333345</pub-id>
          <pub-id pub-id-type="pii">6554005</pub-id>
          <pub-id pub-id-type="pmcid">PMC9196678</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Pei</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Tiwari</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Pre-trained language models in biomedical domain: a systematic survey</article-title>
          <source>ACM Comput Surv</source>
          <year>2023</year>
          <volume>56</volume>
          <issue>3</issue>
          <fpage>1</fpage>
          <lpage>52</lpage>
          <pub-id pub-id-type="doi">10.1145/3611651</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="web">
          <source>A Inteligência Artificial na Saúde, uma Breve Perspectiva</source>
          <access-date>2024-05-18</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ey.com/pt_pt/health/a-inteligencia-artificial-na-saude-uma-breve-perspectiva">https://www.ey.com/pt_pt/health/a-inteligencia-artificial-na-saude-uma-breve-perspectiva</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Liberati</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tetzlaff</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>DG</given-names>
            </name>
            <collab>PRISMA Group</collab>
          </person-group>
          <article-title>Preferred reporting items for systematic reviews and meta-analyses: the PRISMA statement</article-title>
          <source>Int J Surg</source>
          <year>2010</year>
          <volume>8</volume>
          <issue>5</issue>
          <fpage>336</fpage>
          <lpage>341</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1743-9191(10)00040-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijsu.2010.02.007</pub-id>
          <pub-id pub-id-type="medline">20171303</pub-id>
          <pub-id pub-id-type="pii">S1743-9191(10)00040-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="web">
          <source>Scopus - Document search</source>
          <access-date>2023-05-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.scopus.com/search/form.uri?display=basic#basic">https://www.scopus.com/search/form.uri?display=basic#basic</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
          <article-title>Web of science core collection</article-title>
          <source>Clarivate</source>
          <access-date>2024-01-26</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://clarivate.com/products/scientific-and-academic-research/research-discovery-and-workflow-solutions/webofscience-platform/web-of-science-core-collection/">https://clarivate.com/products/scientific-and-academic-research/research-discovery-and-workflow-solutions/webofscience-platform/web-of-science-core-collection/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pranckutė</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Web of science (WoS) and scopus: The titans of bibliographic information in today’s academic world</article-title>
          <source>Publications</source>
          <year>2021</year>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>12</fpage>
          <pub-id pub-id-type="doi">10.3390/publications9010012</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>A tale of two databases: the use of web of science and scopus in academic papers</article-title>
          <source>Scientometrics</source>
          <year>2020</year>
          <volume>123</volume>
          <issue>1</issue>
          <fpage>321</fpage>
          <lpage>335</lpage>
          <pub-id pub-id-type="doi">10.1007/s11192-020-03387-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Page</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>McKenzie</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Bossuyt</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Boutron</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffmann</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Mulrow</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Shamseer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tetzlaff</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Akl</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Glanville</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Grimshaw</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Hróbjartsson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lalu</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Loder</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Mayo-Wilson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>McDonald</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McGuinness</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tricco</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Welch</surname>
              <given-names>VA</given-names>
            </name>
            <name name-style="western">
              <surname>Whiting</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The PRISMA 2020 statement: an updated guideline for reporting systematic reviews</article-title>
          <source>BMJ</source>
          <year>2021</year>
          <volume>372</volume>
          <fpage>n71</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/lookup/pmidlookup?view=long&amp;pmid=33782057"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.n71</pub-id>
          <pub-id pub-id-type="medline">33782057</pub-id>
          <pub-id pub-id-type="pmcid">PMC8005924</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Thorsteinsdottir</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lopes</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Pagali</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>LeBrasseur</surname>
              <given-names>NK</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rocca</surname>
              <given-names>WA</given-names>
            </name>
            <name name-style="western">
              <surname>Olson</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Sauver</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A hybrid model to identify fall occurrence from electronic health records</article-title>
          <source>Int J Med Inf</source>
          <year>2022</year>
          <volume>162</volume>
          <fpage>104736</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35316697"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2022.104736</pub-id>
          <pub-id pub-id-type="medline">35316697</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(22)00050-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC9448825</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roitero</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Portelli</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Popescu</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Mea</surname>
              <given-names>VD</given-names>
            </name>
          </person-group>
          <article-title>DiLBERT: cheap embeddings for disease related medical NLP</article-title>
          <source>IEEE Access</source>
          <year>2021</year>
          <volume>9</volume>
          <fpage>159714</fpage>
          <lpage>159723</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2021.3131386</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agnikula Kshatriya</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Sagheb</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Wi</surname>
              <given-names>CI</given-names>
            </name>
            <name name-style="western">
              <surname>Yoon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Seol</surname>
              <given-names>HY</given-names>
            </name>
            <name name-style="western">
              <surname>Juhn</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Identification of asthma control factor in clinical notes using a hybrid deep learning model</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2021</year>
          <volume>21</volume>
          <issue>Suppl 7</issue>
          <fpage>272</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-021-01633-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-021-01633-4</pub-id>
          <pub-id pub-id-type="medline">34753481</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-021-01633-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC8579684</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bui</surname>
              <given-names>AAT</given-names>
            </name>
          </person-group>
          <article-title>AdaDiag: adversarial domain adaptation of diagnostic prediction with clinical event sequences</article-title>
          <source>J Biomed Inform</source>
          <year>2022</year>
          <volume>134</volume>
          <fpage>104168</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(22)00179-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2022.104168</pub-id>
          <pub-id pub-id-type="medline">35987449</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(22)00179-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC9580228</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>P-F</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K-C</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>W-C</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>T-L</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>S-C</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W-J</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>C-Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y-C</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>I-C</given-names>
            </name>
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>C-H</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>S-C</given-names>
            </name>
            <name name-style="western">
              <surname>Hung</surname>
              <given-names>F-M</given-names>
            </name>
          </person-group>
          <article-title>Automatic international classification of diseases coding system: deep contextualized language model with rule-based approaches</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <volume>10</volume>
          <issue>6</issue>
          <fpage>e37557</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/6/e37557/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/37557</pub-id>
          <pub-id pub-id-type="medline">35767353</pub-id>
          <pub-id pub-id-type="pii">v10i6e37557</pub-id>
          <pub-id pub-id-type="pmcid">PMC9282222</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sheng</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Cloud-based intelligent self-diagnosis and department recommendation service using Chinese medical BERT</article-title>
          <source>J Cloud Comp</source>
          <year>2021</year>
          <volume>10</volume>
          <issue>1</issue>
          <pub-id pub-id-type="doi">10.1186/s13677-020-00218-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Cross domains adversarial learning for Chinese named entity recognition for online medical consultation</article-title>
          <source>J Biomed Inform</source>
          <year>2020</year>
          <volume>112</volume>
          <fpage>103608</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(20)30237-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2020.103608</pub-id>
          <pub-id pub-id-type="medline">33132138</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(20)30237-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Jia</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Medical named entity recognition from un-labelled medical records based on pre-trained language models and domain dictionary</article-title>
          <source>Data Intell</source>
          <year>2021</year>
          <volume>3</volume>
          <issue>3</issue>
          <fpage>402</fpage>
          <lpage>417</lpage>
          <pub-id pub-id-type="doi">10.1162/dint_a_00105</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Jia</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Hua</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Conceptualized representation learning for Chinese biomedical text mining</article-title>
          <source>Computer Science Computation and Language</source>
          <year>2020</year>
          <access-date>2023-10-19</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/2008.10813">http://arxiv.org/abs/2008.10813</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schneider</surname>
              <given-names>ETR</given-names>
            </name>
            <name name-style="western">
              <surname>de Souza</surname>
              <given-names>JVA</given-names>
            </name>
            <name name-style="western">
              <surname>Knafou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Oliveira</surname>
              <given-names>LES</given-names>
            </name>
            <name name-style="western">
              <surname>Copara</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gumiel</surname>
              <given-names>YB</given-names>
            </name>
            <name name-style="western">
              <surname>Oliveira</surname>
              <given-names>LFAD</given-names>
            </name>
            <name name-style="western">
              <surname>Paraiso</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Teodoro</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Barra</surname>
              <given-names>CMCM</given-names>
            </name>
          </person-group>
          <article-title>BioBERTpt - a portuguese neural language model for clinical named entity recognition</article-title>
          <year>2020</year>
          <conf-name>Proceedings of the 3rd Clinical Natural Language Processing Workshop</conf-name>
          <conf-date>August 27, 2024</conf-date>
          <conf-loc>USA</conf-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>65</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2020.clinicalnlp-1.7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schneider</surname>
              <given-names>ETR</given-names>
            </name>
            <name name-style="western">
              <surname>Gumiel</surname>
              <given-names>YB</given-names>
            </name>
            <name name-style="western">
              <surname>De Souza</surname>
              <given-names>JVA</given-names>
            </name>
            <name name-style="western">
              <surname>Mie</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Emanuel</surname>
              <given-names>SEOL</given-names>
            </name>
            <name name-style="western">
              <surname>De</surname>
              <given-names>SRM</given-names>
            </name>
            <name name-style="western">
              <surname>Antonio</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Eduardo</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Teodoro</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Moro</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Paraiso</surname>
              <given-names>EC</given-names>
            </name>
          </person-group>
          <article-title>CardioBERTpt: transformer-based models for cardiology language representation in portuguese</article-title>
          <year>2023</year>
          <conf-name>Proceedings of the 2023 IEEE 36th International Symposium on Computer-Based Medical Systems (CBMS)</conf-name>
          <conf-date>June 22-24, 2023</conf-date>
          <conf-loc>L'Aquila, Italy</conf-loc>
          <fpage>378</fpage>
          <lpage>381</lpage>
          <pub-id pub-id-type="doi">10.1109/CBMS58004.2023.00247</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carrino</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Llop</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pàmies</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gutiérrez-Fandiño</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Armengol-Estapé</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Silveira-Ocampo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Valencia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez-Agirre</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Villegas</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Pre-trained biomedical language models for clinical NLP in Spanish</article-title>
          <source>ACL Anthology</source>
          <year>2022</year>
          <fpage>193</fpage>
          <lpage>199</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2022.bionlp-1.19</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Coutinho</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Martins</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Transformer-based models for ICD-10 coding of death certificates with portuguese text</article-title>
          <source>J Biomed Inform</source>
          <year>2022</year>
          <volume>136</volume>
          <fpage>104232</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(22)00237-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2022.104232</pub-id>
          <pub-id pub-id-type="medline">36307020</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(22)00237-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Transfer learning in biomedical natural Language processing: an evaluation of BERT and ELMo on ten benchmarking datasets</article-title>
          <source>Computer Science Computation and Language</source>
          <year>2019</year>
          <pub-id pub-id-type="doi">10.18653/v1/w19-5006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ott</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Goyal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Joshi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zettlemoyer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Stoyanov</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>RoBERTa: a robustly optimized BERT pretraining approach</article-title>
          <source>Annual Reviews</source>
          <year>2019</year>
          <volume>21</volume>
          <issue>2</issue>
          <fpage>8</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.5260/chara.21.2.8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="web">
          <source>Google Académico</source>
          <access-date>2023-11-03</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://scholar.google.com/">https://scholar.google.com/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Blaes</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>A cross-institutional evaluation on breast cancer phenotyping NLP algorithms on electronic health records</article-title>
          <source>Comput Struct Biotechnol J</source>
          <year>2023</year>
          <volume>22</volume>
          <fpage>32</fpage>
          <lpage>40</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2001-0370(23)00293-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.csbj.2023.08.018</pub-id>
          <pub-id pub-id-type="medline">37680211</pub-id>
          <pub-id pub-id-type="pii">S2001-0370(23)00293-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC10480628</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rahman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mittendorf</surname>
              <given-names>KF</given-names>
            </name>
            <name name-style="western">
              <surname>Lenoue-Newton</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Micheel</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wolber</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Osterman</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fabbri</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Accelerated curation of checkpoint inhibitor-induced colitis cases from electronic health records</article-title>
          <source>JAMIA Open</source>
          <year>2023</year>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>ooad017</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37012912"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamiaopen/ooad017</pub-id>
          <pub-id pub-id-type="medline">37012912</pub-id>
          <pub-id pub-id-type="pii">ooad017</pub-id>
          <pub-id pub-id-type="pmcid">PMC10066800</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Crema</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Buonocore</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Fostinelli</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Parimbelli</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Verde</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Fundarò</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Manera</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ramusino</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Capelli</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Costa</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Binetti</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bellazzi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Redolfi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Advancing italian biomedical information extraction with transformers-based models: methodological insights and multicenter practical application</article-title>
          <source>J Biomed Inform</source>
          <year>2023</year>
          <volume>148</volume>
          <fpage>104557</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://air.unimi.it/handle/2434/1032034"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2023.104557</pub-id>
          <pub-id pub-id-type="medline">38012982</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(23)00278-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Huangfu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gong</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Application of entity-BERT model based on neuroscience and brain-like cognition in electronic medical record entity recognition</article-title>
          <source>Front Neurosci</source>
          <year>2023</year>
          <volume>17</volume>
          <fpage>1259652</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37799340"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fnins.2023.1259652</pub-id>
          <pub-id pub-id-type="medline">37799340</pub-id>
          <pub-id pub-id-type="pmcid">PMC10547885</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Qin</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Combining data augmentation and domain information with TENER model for clinical event detection</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2021</year>
          <volume>21</volume>
          <issue>Suppl 9</issue>
          <fpage>261</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-021-01618-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-021-01618-3</pub-id>
          <pub-id pub-id-type="medline">34789246</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-021-01618-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC8596895</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>HK</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>You</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Bae</surname>
              <given-names>YS</given-names>
            </name>
          </person-group>
          <article-title>Identifying alcohol-related information from unstructured bilingual clinical notes with multilingual transformers</article-title>
          <source>IEEE Access</source>
          <year>2023</year>
          <volume>11</volume>
          <fpage>16066</fpage>
          <lpage>16075</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2023.3245523</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kormilitzin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vaci</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Nevado-Holgado</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Med7: a transferable clinical natural language processing model for electronic health records</article-title>
          <source>Artif Intell Med</source>
          <year>2021</year>
          <volume>118</volume>
          <fpage>102086</fpage>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2021.102086</pub-id>
          <pub-id pub-id-type="medline">34412834</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(21)00079-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Solarte-Pabón</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Montenegro</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>García-Barragán</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Torrente</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Provencio</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Menasalvas</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Robles</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Transformers for extracting breast cancer information from Spanish clinical narratives</article-title>
          <source>Artif Intell Med</source>
          <year>2023</year>
          <volume>143</volume>
          <fpage>102625</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0933-3657(23)00139-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2023.102625</pub-id>
          <pub-id pub-id-type="medline">37673566</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(23)00139-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Xin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Automatic knowledge extraction from chinese electronic medical records and rheumatoid arthritis knowledge graph construction</article-title>
          <source>Quant Imaging Med Surg</source>
          <year>2023</year>
          <volume>13</volume>
          <issue>6</issue>
          <fpage>3873</fpage>
          <lpage>3890</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37284084"/>
          </comment>
          <pub-id pub-id-type="doi">10.21037/qims-22-1158</pub-id>
          <pub-id pub-id-type="medline">37284084</pub-id>
          <pub-id pub-id-type="pii">qims-13-06-3873</pub-id>
          <pub-id pub-id-type="pmcid">PMC10240026</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hwang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hernandez-Boussard</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Leveraging weak supervision to perform named entity recognition in electronic health records progress notes to identify the ophthalmology exam</article-title>
          <source>Int J Med Inform</source>
          <year>2022</year>
          <volume>167</volume>
          <fpage>104864</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36179600"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2022.104864</pub-id>
          <pub-id pub-id-type="medline">36179600</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(22)00178-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC9901505</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Haimovich</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Reeder</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Khurshid</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Cunningham</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Philippakis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Lubitz</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Batra</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>One clinician is all you need-cardiac magnetic resonance imaging measurement extraction: deep learning algorithm development</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <volume>10</volume>
          <issue>9</issue>
          <fpage>e38178</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/9/e38178/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/38178</pub-id>
          <pub-id pub-id-type="medline">35960155</pub-id>
          <pub-id pub-id-type="pii">v10i9e38178</pub-id>
          <pub-id pub-id-type="pmcid">PMC9526125</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Heider</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Lally</surname>
              <given-names>IRH</given-names>
            </name>
            <name name-style="western">
              <surname>Meystre</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>A hybrid model for family history information identification and relation extraction: development and evaluation of an end-to-end information extraction system</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <volume>9</volume>
          <issue>4</issue>
          <fpage>e22797</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/4/e22797/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/22797</pub-id>
          <pub-id pub-id-type="medline">33885370</pub-id>
          <pub-id pub-id-type="pii">v9i4e22797</pub-id>
          <pub-id pub-id-type="pmcid">PMC8103307</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Construction of genealogical knowledge graphs from obituaries: multitask neural network extraction system</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <volume>23</volume>
          <issue>8</issue>
          <fpage>e25670</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/8/e25670/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/25670</pub-id>
          <pub-id pub-id-type="medline">34346903</pub-id>
          <pub-id pub-id-type="pii">v23i8e25670</pub-id>
          <pub-id pub-id-type="pmcid">PMC8374669</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Silva</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Almeida</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Matos</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Extraction of family history information from clinical notes: deep learning and heuristics approach</article-title>
          <source>JMIR Med Inform</source>
          <year>2020</year>
          <volume>8</volume>
          <issue>12</issue>
          <fpage>e22898</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2020/12/e22898/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/22898</pub-id>
          <pub-id pub-id-type="medline">33372893</pub-id>
          <pub-id pub-id-type="pii">v8i12e22898</pub-id>
          <pub-id pub-id-type="pmcid">PMC7803476</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>H-J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Y-Q</given-names>
            </name>
            <name name-style="western">
              <surname>Nekkantti</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jonnagaddala</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Family history information extraction with neural attention and an enhanced relation-side scheme: algorithm development and validation</article-title>
          <source>JMIR Med Inform</source>
          <year>2020</year>
          <volume>8</volume>
          <issue>12</issue>
          <fpage>e21750</fpage>
          <pub-id pub-id-type="doi">10.2196/21750</pub-id>
          <pub-id pub-id-type="medline">33258777</pub-id>
          <pub-id pub-id-type="pii">v8i12e21750</pub-id>
          <pub-id pub-id-type="pmcid">PMC7738250</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Xiong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Novel graph-based model with biaffine attention for family history extraction from clinical text: modeling study</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <volume>9</volume>
          <issue>4</issue>
          <fpage>e23587</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/4/e23587/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/23587</pub-id>
          <pub-id pub-id-type="medline">33881405</pub-id>
          <pub-id pub-id-type="pii">v9i4e23587</pub-id>
          <pub-id pub-id-type="pmcid">PMC8100876</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Pou-Prom</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Banning</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mamdani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Oh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Antoniou</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Assessment of natural language processing methods for ascertaining the expanded disability status scale score from the electronic health records of patients with multiple sclerosis: algorithm development and validation study</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>e25157</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/1/e25157/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/25157</pub-id>
          <pub-id pub-id-type="medline">35019849</pub-id>
          <pub-id pub-id-type="pii">v10i1e25157</pub-id>
          <pub-id pub-id-type="pmcid">PMC8792771</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Santus</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yala</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Peck</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Soomro</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Faridi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Mamshad</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lanahan</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Barzilay</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hughes</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Do neural information extraction algorithms generalize across institutions?</article-title>
          <source>JCO Clin Cancer Inform</source>
          <year>2019</year>
          <volume>3</volume>
          <fpage>1</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ascopubs.org/doi/10.1200/CCI.18.00160?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1200/CCI.18.00160</pub-id>
          <pub-id pub-id-type="medline">31310566</pub-id>
          <pub-id pub-id-type="pmcid">PMC6874001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mahajan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rana</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Feature optimization in CNN using MROA for disease classification</article-title>
          <source>IDT</source>
          <year>2023</year>
          <volume>17</volume>
          <issue>2</issue>
          <fpage>301</fpage>
          <lpage>315</lpage>
          <pub-id pub-id-type="doi">10.3233/idt-220097</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Landolsi</surname>
              <given-names>MY</given-names>
            </name>
            <name name-style="western">
              <surname>Hlaoua</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Romdhane</surname>
              <given-names>LB</given-names>
            </name>
          </person-group>
          <article-title>Hybrid method to automatically extract medical document tree structure</article-title>
          <source>Eng Appl Artif Intell</source>
          <year>2023</year>
          <volume>120</volume>
          <fpage>105922</fpage>
          <pub-id pub-id-type="doi">10.1016/j.engappai.2023.105922</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wunnava</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Qin</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Kakar</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rundensteiner</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Kong</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Adverse drug event detection from electronic health records using hierarchical recurrent neural networks with dual-level embedding</article-title>
          <source>Drug Saf</source>
          <year>2019</year>
          <volume>42</volume>
          <issue>1</issue>
          <fpage>113</fpage>
          <lpage>122</lpage>
          <pub-id pub-id-type="doi">10.1007/s40264-018-0765-9</pub-id>
          <pub-id pub-id-type="medline">30649736</pub-id>
          <pub-id pub-id-type="pii">10.1007/s40264-018-0765-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Viani</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Napolitano</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Priori</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>GK</given-names>
            </name>
            <name name-style="western">
              <surname>Bellazzi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sacchi</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Supervised methods to extract clinical events from cardiology reports in Italian</article-title>
          <source>J Biomed Inform</source>
          <year>2019</year>
          <volume>95</volume>
          <fpage>103219</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30139-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103219</pub-id>
          <pub-id pub-id-type="medline">31150777</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30139-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC6948016</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Information extraction for intestinal cancer electronic medical records</article-title>
          <source>IEEE Access</source>
          <year>2020</year>
          <volume>8</volume>
          <fpage>125923</fpage>
          <lpage>125934</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2020.3005684</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ju</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Short</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bakerly</surname>
              <given-names>ND</given-names>
            </name>
            <name name-style="western">
              <surname>Gkoutos</surname>
              <given-names>GV</given-names>
            </name>
            <name name-style="western">
              <surname>Tsaprouni</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ananiadou</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Annotating and detecting phenotypic information for chronic obstructive pulmonary disease</article-title>
          <source>JAMIA Open</source>
          <year>2019</year>
          <volume>2</volume>
          <issue>2</issue>
          <fpage>261</fpage>
          <lpage>271</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31984360"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamiaopen/ooz009</pub-id>
          <pub-id pub-id-type="medline">31984360</pub-id>
          <pub-id pub-id-type="pii">ooz009</pub-id>
          <pub-id pub-id-type="pmcid">PMC6951876</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lopes</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Teixeira</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gonçalo Oliveira</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Comparing different methods for named entity recognition in portuguese neurology text</article-title>
          <source>J Med Syst</source>
          <year>2020</year>
          <volume>44</volume>
          <issue>4</issue>
          <fpage>77</fpage>
          <pub-id pub-id-type="doi">10.1007/s10916-020-1542-8</pub-id>
          <pub-id pub-id-type="medline">32112285</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10916-020-1542-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alfattni</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Belousov</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Peek</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Nenadic</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Extracting drug names and associated attributes from discharge summaries: text mining study</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <volume>9</volume>
          <issue>5</issue>
          <fpage>e24678</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/5/e24678/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/24678</pub-id>
          <pub-id pub-id-type="medline">33949962</pub-id>
          <pub-id pub-id-type="pii">v9i5e24678</pub-id>
          <pub-id pub-id-type="pmcid">PMC8135022</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Weiner</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Hernandez</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kimura</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kharrazi</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Extraction of geriatric syndromes from electronic health record clinical notes: assessment of statistical natural language processing methods</article-title>
          <source>JMIR Med Inform</source>
          <year>2019</year>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>e13039</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2019/1/e13039/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13039</pub-id>
          <pub-id pub-id-type="medline">30862607</pub-id>
          <pub-id pub-id-type="pii">v7i1e13039</pub-id>
          <pub-id pub-id-type="pmcid">PMC6454337</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Fine-tuning ERNIE for chest abnormal imaging signs extraction</article-title>
          <source>J Biomed Inform</source>
          <year>2020</year>
          <volume>108</volume>
          <fpage>103492</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(20)30120-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2020.103492</pub-id>
          <pub-id pub-id-type="medline">32645382</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(20)30120-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jouffroy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Feldman</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Lerner</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Rance</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Burgun</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Neuraz</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Hybrid deep learning for medication-related information extraction from clinical texts in French: MedExt algorithm development study</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <volume>9</volume>
          <issue>3</issue>
          <fpage>e17934</fpage>
          <pub-id pub-id-type="doi">10.2196/17934</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Entity recognition of Chinese medical text based on multi-head self-attention combined with BILSTM-CRF</article-title>
          <source>Math Biosci Eng</source>
          <year>2022</year>
          <volume>19</volume>
          <issue>3</issue>
          <fpage>2206</fpage>
          <lpage>2218</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aimspress.com/article/10.3934/mbe.2022103"/>
          </comment>
          <pub-id pub-id-type="doi">10.3934/mbe.2022103</pub-id>
          <pub-id pub-id-type="medline">35240782</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zanotto</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Beck da Silva Etges</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Dal Bosco</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cortes</surname>
              <given-names>EG</given-names>
            </name>
            <name name-style="western">
              <surname>Ruschel</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>De Souza</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Andrade</surname>
              <given-names>CMV</given-names>
            </name>
            <name name-style="western">
              <surname>Viegas</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Canuto</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Luiz</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ouriques Martins</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Vieira</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Polanczyk</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>André Gonçalves</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Stroke outcome measurements from electronic medical records: cross-sectional study on the effectiveness of neural and nonneural classifiers</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <volume>9</volume>
          <issue>11</issue>
          <fpage>e29120</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/11/e29120/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/29120</pub-id>
          <pub-id pub-id-type="medline">34723829</pub-id>
          <pub-id pub-id-type="pii">v9i11e29120</pub-id>
          <pub-id pub-id-type="pmcid">PMC8593798</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Steinkamp</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Chambers</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lalevic</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zafar</surname>
              <given-names>HM</given-names>
            </name>
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>TS</given-names>
            </name>
          </person-group>
          <article-title>Toward complete structured information extraction from radiology reports using machine learning</article-title>
          <source>J Digit Imaging</source>
          <year>2019</year>
          <volume>32</volume>
          <issue>4</issue>
          <fpage>554</fpage>
          <lpage>564</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31218554"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10278-019-00234-y</pub-id>
          <pub-id pub-id-type="medline">31218554</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10278-019-00234-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC6646440</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>OV</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Denhalter</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>Lye</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Stevens</surname>
              <given-names>VW</given-names>
            </name>
            <name name-style="western">
              <surname>Gamage</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Roselle</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Automated travel history extraction from clinical notes for informing the detection of emergent infectious disease events: algorithm development and validation</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2021</year>
          <volume>7</volume>
          <issue>3</issue>
          <fpage>e26719</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2021/3/e26719/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26719</pub-id>
          <pub-id pub-id-type="medline">33759790</pub-id>
          <pub-id pub-id-type="pii">v7i3e26719</pub-id>
          <pub-id pub-id-type="pmcid">PMC7993087</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Malmasi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Hosomura</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Turchin</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Comparing information extraction techniques for low-prevalence concepts: The case of insulin rejection by patients</article-title>
          <source>J Biomed Inform</source>
          <year>2019</year>
          <volume>99</volume>
          <fpage>103306</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30225-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103306</pub-id>
          <pub-id pub-id-type="medline">31618679</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30225-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>VZ</given-names>
            </name>
            <name name-style="western">
              <surname>Hollander</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>RT</given-names>
            </name>
            <name name-style="western">
              <surname>Isaac</surname>
              <given-names>KV</given-names>
            </name>
          </person-group>
          <article-title>Automated medical chart review for breast cancer outcomes research: a novel natural language processing extraction system</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2022</year>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>136</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/s12874-022-01583-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12874-022-01583-z</pub-id>
          <pub-id pub-id-type="medline">35549854</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12874-022-01583-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC9101856</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sterckx</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Vandewiele</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dehaene</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Janssens</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Ongenae</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>De Backere</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>De Turck</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Roelens</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Decruyenaere</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Van Hoecke</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Demeester</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Clinical information extraction for preterm birth risk prediction</article-title>
          <source>J Biomed Inform</source>
          <year>2020</year>
          <volume>110</volume>
          <fpage>103544</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(20)30172-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2020.103544</pub-id>
          <pub-id pub-id-type="medline">32858168</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(20)30172-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Contextual embedding bootstrapped neural network for medical information extraction of coronary artery disease records</article-title>
          <source>Med Biol Eng Comput</source>
          <year>2021</year>
          <volume>59</volume>
          <issue>5</issue>
          <fpage>1111</fpage>
          <lpage>1121</lpage>
          <pub-id pub-id-type="doi">10.1007/s11517-021-02359-1</pub-id>
          <pub-id pub-id-type="medline">33893606</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11517-021-02359-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dandala</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Joopudi</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Tsou</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Suryanarayanan</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Extraction of information related to drug safety surveillance from electronic health record notes: joint modeling of entities and relations using knowledge-aware neural attentive models</article-title>
          <source>JMIR Med Inform</source>
          <year>2020</year>
          <volume>8</volume>
          <issue>7</issue>
          <fpage>e18417</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2020/7/e18417/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/18417</pub-id>
          <pub-id pub-id-type="medline">32459650</pub-id>
          <pub-id pub-id-type="pii">v8i7e18417</pub-id>
          <pub-id pub-id-type="pmcid">PMC7382020</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Duan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xing</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Moving toward a standardized diagnostic statement of pituitary adenoma using an information extraction model: a real-world study based on electronic medical records</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2022</year>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>319</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-022-02031-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-022-02031-0</pub-id>
          <pub-id pub-id-type="medline">36476365</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-022-02031-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC9727982</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kraljevic</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Searle</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Shek</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Roguski</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Noor</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bean</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mascio</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Folarin</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bendayan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Richardson</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>WK</given-names>
            </name>
            <name name-style="western">
              <surname>Ibrahim</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Teo</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Dobson</surname>
              <given-names>RJB</given-names>
            </name>
          </person-group>
          <article-title>Multi-domain clinical natural language processing with MedCAT: The medical concept annotation toolkit</article-title>
          <source>Artif Intell Med</source>
          <year>2021</year>
          <volume>117</volume>
          <fpage>102083</fpage>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2021.102083</pub-id>
          <pub-id pub-id-type="medline">34127232</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(21)00076-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dewaswala</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bhopalwala</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kaggal</surname>
              <given-names>VC</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SP</given-names>
            </name>
            <name name-style="western">
              <surname>Bos</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Geske</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Gersh</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ommen</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Araoz</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Ackerman</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Arruda-Olson</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing for identification of hypertrophic cardiomyopathy patients from cardiac magnetic resonance reports</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2022</year>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>272</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-022-02017-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-022-02017-y</pub-id>
          <pub-id pub-id-type="medline">36258218</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-022-02017-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC9580188</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Shao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Using natural language processing to extract clinically useful information from chinese electronic medical records</article-title>
          <source>Int J Med Inform</source>
          <year>2019</year>
          <volume>124</volume>
          <fpage>6</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2019.01.004</pub-id>
          <pub-id pub-id-type="medline">30784428</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(18)30594-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lv</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Research on named entity recognition of chinese electronic medical records based on multi-head attention mechanism and character-word information fusion</article-title>
          <source>IFS</source>
          <year>2022</year>
          <volume>42</volume>
          <issue>4</issue>
          <fpage>4105</fpage>
          <lpage>4116</lpage>
          <pub-id pub-id-type="doi">10.3233/jifs-212495</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>spaCy</collab>
          </person-group>
          <source>Language processing pipelines</source>
          <access-date>2023-11-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://spacy.io/usage/processing-pipelines/">https://spacy.io/usage/processing-pipelines/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Neumann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Iyyer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gardner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zettlemoyer</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Stent</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Deep contextualized word representations</article-title>
          <source>Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long Papers)</source>
          <year>2018</year>
          <publisher-loc>New Orleans, Louisiana</publisher-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>2227</fpage>
          <lpage>2237</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>EK</given-names>
            </name>
            <name name-style="western">
              <surname>Uppal</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>CERC: an interactive content extraction, recognition, and construction tool for clinical and biomedical text</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2020</year>
          <volume>20</volume>
          <issue>Suppl 14</issue>
          <fpage>306</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-020-01330-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-020-01330-8</pub-id>
          <pub-id pub-id-type="medline">33323109</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-020-01330-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC7739454</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref83">
        <label>83</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y-P</given-names>
            </name>
            <name name-style="western">
              <surname>Lo</surname>
              <given-names>Y-H</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>C-H</given-names>
            </name>
          </person-group>
          <article-title>Disease concept-embedding based on the self-supervised method for medical information extraction from electronic health records and disease retrieval: algorithm development and validation study</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>e25113</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/1/e25113/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/25113</pub-id>
          <pub-id pub-id-type="medline">33502324</pub-id>
          <pub-id pub-id-type="pii">v23i1e25113</pub-id>
          <pub-id pub-id-type="pmcid">PMC7875703</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref84">
        <label>84</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sykes</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Grivas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Grover</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tobin</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sudlow</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Whiteley</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Mcintosh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Whalley</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Alex</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Comparison of rule-based and neural network models for negation detection in radiology reports</article-title>
          <source>Nat Lang Eng</source>
          <year>2021</year>
          <volume>27</volume>
          <issue>2</issue>
          <fpage>203</fpage>
          <lpage>224</lpage>
          <pub-id pub-id-type="doi">10.1017/s1351324920000509</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref85">
        <label>85</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chaturvedi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chance</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Mirza</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Vernugopan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Velupillai</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Development of a corpus annotated with mentions of pain in mental health records: natural language processing approach</article-title>
          <source>JMIR Form Res</source>
          <year>2023</year>
          <volume>7</volume>
          <fpage>e45849</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://formative.jmir.org/2023//e45849/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/45849</pub-id>
          <pub-id pub-id-type="medline">37358897</pub-id>
          <pub-id pub-id-type="pii">v7i1e45849</pub-id>
          <pub-id pub-id-type="pmcid">PMC10337440</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref86">
        <label>86</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Newman-Griffis</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Divita</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Desmet</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zirikly</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rosé</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Fosler-Lussier</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Ambiguity in medical concept normalization: an analysis of types and coverage in electronic health record datasets</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2021</year>
          <volume>28</volume>
          <issue>3</issue>
          <fpage>516</fpage>
          <lpage>532</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33319905"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocaa269</pub-id>
          <pub-id pub-id-type="medline">33319905</pub-id>
          <pub-id pub-id-type="pii">6034899</pub-id>
          <pub-id pub-id-type="pmcid">PMC7936394</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref87">
        <label>87</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jaber</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Martínez</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Disambiguating clinical abbreviations using a one-fits-all classifier based on deep learning techniques</article-title>
          <source>Methods Inf Med</source>
          <year>2022</year>
          <volume>61</volume>
          <issue>S 01</issue>
          <fpage>e28</fpage>
          <lpage>e34</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.thieme-connect.com/DOI/DOI?10.1055/s-0042-1742388"/>
          </comment>
          <pub-id pub-id-type="doi">10.1055/s-0042-1742388</pub-id>
          <pub-id pub-id-type="medline">35104909</pub-id>
          <pub-id pub-id-type="pmcid">PMC9246508</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref88">
        <label>88</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Heo</surname>
              <given-names>GE</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>MLM-based typographical error correction of unstructured medical texts for named entity recognition</article-title>
          <source>BMC Bioinformatics</source>
          <year>2022</year>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>486</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/s12859-022-05035-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12859-022-05035-9</pub-id>
          <pub-id pub-id-type="medline">36384464</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12859-022-05035-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC9670595</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
