<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v11i1e44892</article-id>
      <article-id pub-id-type="pmid">37796584</article-id>
      <article-id pub-id-type="doi">10.2196/44892</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A Multilabel Text Classifier of Cancer Literature at the Publication Level: Methods Study of Medical Text Classification</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Benis</surname>
            <given-names>Arriel</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Ben-Miled</surname>
            <given-names>Zina</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Guo</surname>
            <given-names>Lei</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Ying</given-names>
          </name>
          <degrees>MA</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5858-801X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Xiaoying</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4407-6616</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Yi</given-names>
          </name>
          <degrees>MA</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8188-6277</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Aihua</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6742-3268</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>Xuemei</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2927-4166</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Tang</surname>
            <given-names>Xiaoli</given-names>
          </name>
          <degrees>MA</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Institute of Medical Information</institution>
            <institution>Chinese Academy of Medical Sciences</institution>
            <addr-line>No 69, Dongdan North Street</addr-line>
            <addr-line>Beijing, 100020</addr-line>
            <country>China</country>
            <phone>86 10 52328902</phone>
            <email>tang.xiaoli@imicams.ac.cn</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6946-3482</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Institute of Medical Information</institution>
        <institution>Chinese Academy of Medical Sciences</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Xiaoli Tang <email>tang.xiaoli@imicams.ac.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>5</day>
        <month>10</month>
        <year>2023</year>
      </pub-date>
      <volume>11</volume>
      <elocation-id>e44892</elocation-id>
      <history>
        <date date-type="received">
          <day>7</day>
          <month>12</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>11</day>
          <month>1</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>7</day>
          <month>3</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>6</day>
          <month>9</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Ying Zhang, Xiaoying Li, Yi Liu, Aihua Li, Xuemei Yang, Xiaoli Tang. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 05.10.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2023/1/e44892" xlink:type="simple"/>
      <related-article related-article-type="correction-forward" xlink:title="This is a corrected version. See correction statement in:" xlink:href="http://medinform.jmir.org/2024/1/e62757/" vol="12" page="e62757"> </related-article>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Given the threat posed by cancer to human health, there is a rapid growth in the volume of data in the cancer field and interdisciplinary and collaborative research is becoming increasingly important for fine-grained classification. The low-resolution classifier of reported studies at the journal level fails to satisfy advanced searching demands, and a single label does not adequately characterize the literature originated from interdisciplinary research results. There is thus a need to establish a multilabel classifier with higher resolution to support literature retrieval for cancer research and reduce the burden of screening papers for clinical relevance.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The primary objective of this research was to address the low-resolution issue of cancer literature classification due to the ambiguity of the existing journal-level classifier in order to support gaining high-relevance evidence for clinical consideration and all-sided results for literature retrieval.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We trained a multilabel classifier with scalability for classifying the literature on cancer research directly at the publication level to assign proper content-derived labels based on the “Bidirectional Encoder Representation from Transformers (BERT) + X” model and obtain the best option for X. First, a corpus of 70,599 cancer publications retrieved from the Dimensions database was divided into a training and a testing set in a ratio of 7:3. Second, using the classification terminology of International Cancer Research Partnership cancer types, we compared the performance of classifiers developed using BERT and 5 classical deep learning models, such as the text recurrent neural network (TextRNN) and FastText, followed by metrics analysis.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>After comparing various combined deep learning models, we obtained a classifier based on the optimal combination “BERT + TextRNN,” with a precision of 93.09%, a recall of 87.75%, and an <italic>F</italic><sub>1</sub>-score of 90.34%. Moreover, we quantified the distinctive characteristics in the text structure and multilabel distribution in order to generalize the model to other fields with similar characteristics.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The “BERT + TextRNN” model was trained for high-resolution classification of cancer literature at the publication level to support accurate retrieval and academic statistics. The model automatically assigns 1 or more labels to each cancer paper, as required. Quantitative comparison verified that the “BERT + TextRNN” model is the best fit for multilabel classification of cancer literature compared to other models. More data from diverse fields will be collected to testify the scalability and extensibility of the proposed model in the future.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>text classification</kwd>
        <kwd>publication-level classifier</kwd>
        <kwd>cancer literature</kwd>
        <kwd>deep learning</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>According to the World Health Organization (WHO) reports, cancer is one of the leading causes of death worldwide, accounting for nearly 10 million deaths in 2020 [<xref ref-type="bibr" rid="ref1">1</xref>]. With cancer emerging as the greatest threat to human life, there is a rapid growth in the volume of literature published in the cancer field. The trend of disciplinary convergence has led to publications requiring labels from multiple subjects. Consequently, there is increasingly more demand for accurate cancer literature classification for retrieval, evidence support, academic analysis, and statistical evaluation in order to support clinical research, precision medicine, and discovery of interdisciplinary cancer research [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>] by forecasting trends and hotspot statistics.</p>
        <p>Text classification is the process of assigning specific labels to the literature based on individual features. The current methods of classifying the literature can be divided into 3 groups: mapping based, subject information based, and machine learning based [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref6">6</xref>]. Recently, an increasing number of studies have experimented with deep learning to enhance the effects of text classification [<xref ref-type="bibr" rid="ref4">4</xref>]. Most of the existing literature classification (eg, Web of Science, Scopus [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]) is usually carried out at the journal level, that is, all papers in a given journal get the same labeling categories as the hosted journal. However, given that interdisciplinary research is increasing in the cancer field [<xref ref-type="bibr" rid="ref12">12</xref>], there is a need for a more precise classifier, as papers from a journal always present a diverse range of topics [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. Moreover, literature classification at the journal level can no longer adapt to the dynamics of newly developing subjects and fully characterize text features.</p>
      </sec>
      <sec>
        <title>Related Works</title>
        <sec>
          <title>Development of Text Classification Technology</title>
          <p>Text classification technology has undergone rapid development from expert systems to machine learning to finally deep learning [<xref ref-type="bibr" rid="ref15">15</xref>]. Maron [<xref ref-type="bibr" rid="ref16">16</xref>] published the first paper on automatic text classification in 1961. By the end of the 20th century, machine learning had matured into a fully developed field [<xref ref-type="bibr" rid="ref17">17</xref>]. Joachims [<xref ref-type="bibr" rid="ref18">18</xref>] established the bag-of-words model to transform text into a vector with a fixed length and then selected features using the information gain criterion to achieve dimensionality reduction, eventually training the feature vector iteratively using a support vector machine (SVM) classifier. Rasjid [<xref ref-type="bibr" rid="ref19">19</xref>] focused on data classification using k-nearest neighbors (k-NN) and naive Bayes. Liang et al [<xref ref-type="bibr" rid="ref20">20</xref>] improved the feature recognition of the literature using appropriate clusters and the introduction of differential latent semantics index (DLSI) spaces. In 2006, with the rapid development of deep learning, text classification research based on deep learning gradually replaced traditional machine learning methods and became the mainstream, with wide applications in numerous tasks [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
          <p>The deep learning–based text classification method adopts word vectors (eg, GloVe [<xref ref-type="bibr" rid="ref21">21</xref>] and word2vec [<xref ref-type="bibr" rid="ref22">22</xref>]) for word semantic representation [<xref ref-type="bibr" rid="ref23">23</xref>], and subsequently, various deep neural network (DNN)–based text classification methods develop. Convolutional neural networks (CNNs) [<xref ref-type="bibr" rid="ref24">24</xref>] were originally constructed for image processing and have been broadly used for text classification [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref27">27</xref>]. Due to the computational complexity, deep network gradient disappearance, and short text content of a CNN, a series of optimized models were gradually derived to address these issues, including FastText [<xref ref-type="bibr" rid="ref28">28</xref>], deep pyramid convolutional neural networks (DPCNNs) [<xref ref-type="bibr" rid="ref29">29</xref>], knowledge pyramid convolutional neural networks (KPCNNs) [<xref ref-type="bibr" rid="ref30">30</xref>], and text convolutional neural networks (TextCNNs) [<xref ref-type="bibr" rid="ref26">26</xref>]. Especially, the TextCNN is a simple, shallow network and requires only a small number of hyperparameters for fine-tuning. Compared with CNNs, recurrent neural networks (RNNs) can easily implement multilayer superposition to construct a multilayer neural network [<xref ref-type="bibr" rid="ref31">31</xref>], such as multilayer long short-term memory (LSTM) [<xref ref-type="bibr" rid="ref32">32</xref>] or multilayer gate recurrent unit (GRU). In terms of improvements to RNNs, the text recurrent neural network (TextRNN) uses a multitask learning framework to jointly learn across multiple related tasks; a deep recurrent neural network (DRNN) [<xref ref-type="bibr" rid="ref23">23</xref>] incorporates position invariance into an RNN, captures local features to find the optimal window size, and then achieves marked improvements over RNN and CNN models. All these models have laid the foundation for follow-up studies.</p>
          <p>Bidirectional Encoder Representation from Transformers (BERT) has emerged as a new linguistic representation model by the introduction of attentional mechanisms, which have been broadly applied in machine translation [<xref ref-type="bibr" rid="ref32">32</xref>], image description generation [<xref ref-type="bibr" rid="ref33">33</xref>], machine reading comprehension [<xref ref-type="bibr" rid="ref34">34</xref>], and text classification [<xref ref-type="bibr" rid="ref35">35</xref>]. Being a bidirectional encoder model based on a transformer, BERT became an important advancement of natural language processing, especially text classification. For example, Shen et al [<xref ref-type="bibr" rid="ref36">36</xref>] attempted to train a Chinese corpus–based BERT<sub>base</sub> model for the classification of the literature on Chinese social science and technology and also explored its application to practical production. In addition, Lu and Ni [<xref ref-type="bibr" rid="ref37">37</xref>] developed a multilayer model for patent classification using the combination “BERT + CNN,” while Liu et al [<xref ref-type="bibr" rid="ref38">38</xref>] proposed a sentence-BERT for hierarchical clustering of literature abstracts. However, the accuracy of applying universal language models directly to the biomedical field is not sufficient, and this motivated studies to train the biomedical BERT from scratch. Typical instances are BioBERT pretrained on PubMed citations and PubMed Central (PMC) full text [<xref ref-type="bibr" rid="ref39">39</xref>] and PubMedBERT obtained with mixed-domain pretraining using PubMed text and clinical notes [<xref ref-type="bibr" rid="ref40">40</xref>]. Up to now, BioBERT and PubMedBERT have achieved success in named entity recognition, extraction of relationships between entities, entity normalization [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>], <italic>International Classification of Diseases</italic> (ICD) autocoding [<xref ref-type="bibr" rid="ref43">43</xref>], and its multilabel classification (MLC) [<xref ref-type="bibr" rid="ref44">44</xref>]. These studies afford us lessons that merit attention.</p>
        </sec>
        <sec>
          <title>Multilabel Text Classification</title>
          <p>The deep learning model has contributed to the success of MLC due to its dynamic representation learning and end-to-end learning framework. Multilabel text classification (MLTC) is the application of MLC to the task of text classification and the assigning of a set of targeted labels to each sample [<xref ref-type="bibr" rid="ref45">45</xref>], which has been part of the longstanding challenge in both academia and industry. In the biomedical domain, Du et al [<xref ref-type="bibr" rid="ref46">46</xref>] proposed an end-to-end deep learning model ML-Net for biomedical text, while Glinka et al [<xref ref-type="bibr" rid="ref47">47</xref>] focused on a mixture of feature selection methods, filter, and wrapper methods. In addition, Hughes et al [<xref ref-type="bibr" rid="ref48">48</xref>] tried to classify medical text fragments at the sentence level based on a CNN, and Yogarajan et al [<xref ref-type="bibr" rid="ref49">49</xref>] used a multilabel variant of medical text classification to enhance the prediction of concurrent medical codes. Automatic question-and-answer systems and auxiliary decision-making are the 2 typical applications of MLTC. For example, Wasim et al [<xref ref-type="bibr" rid="ref50">50</xref>] proposed a classification model for multilabel problems in the flow of biomedical question-and-answer systems with factlike and listlike questions. Similarly, Baumel et al [<xref ref-type="bibr" rid="ref51">51</xref>] presented a hierarchical attentional bidirectional gated cyclic unit that used attention weights to better understand the sentence and word with the greatest impact on the decision.</p>
          <p>In this study, we adopted MLTC technology to classify cancer publications for better retrieval, academic analysis, and statistical evaluation. We introduced a method of multilabel classification for cancer research at the publication level based on the “BERT + X” model. BERT is a learning model that can migrate to other tasks to obtain better outcomes, which was pretrained on a large and easily accessible data set, and X is a deep learning model that can capture semantic features of text accurately. The combined model was trained on a corpus from a multilabel publication database, and then cancer publications were classified into appropriate categories directly at the publication level instead of the journal level.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design</title>
        <p>This study mainly aimed to train a deep learning–based multilabel classifier for cancer literature classification at the publication level. The overall framework of the study is illustrated in <xref rid="figure1" ref-type="fig">Figure 1</xref>. First, a corpus of titles and abstracts of cancer publications retrieved from the Dimensions database were divided into a training and a testing set in a ratio of 7:3 after preprocessing. Second, to capture sufficient text features for multilabel classification, the titles and abstracts were taken separately as 2 independent layers, which were called the “tuple” in this study. Finally, “BERT + X” classifiers based on 5 deep learning models were trained; X refers to “TextRNN,” “TextCNN,” “FastText,” “DPCNN,” and “DRNN.” The performance of the candidate classifiers was compared quantitatively in terms of 3 conventional metrics in order to identify the optimal model for classifying cancer literature.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Study framework. BERT: Bidirectional Encoder Representation from Transformers; DPCNN: deep pyramid convolutional neural network; DRNN: deep recurrent neural network; TextRNN: text recurrent neural network; TextCNN: text convolutional neural network.</p>
          </caption>
          <graphic xlink:href="medinform_v11i1e44892_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Data Collection and Preprocessing</title>
        <p>Refined data with semantic and context features are the basis of deep learning model training. In this study, to train a lightweight, compatible, and high-applicability classifier for text classification, we first preprocessed cancer literature data to extract features and sequential semantic information. The classification terminology maintained by the International Cancer Research Partnership (ICRP), called cancer type (CT), was used as standard labels to characterize individual cancer studies in terms of 62 CTs. The ICRP CT has been linked to the ICD maintained by WHO [<xref ref-type="bibr" rid="ref52">52</xref>] and is increasingly gaining rapid recognition worldwide. Moreover, the ICRP CT has been applied to several international databases for labeling cancer literature and research documents with fine granularity. A typical example is the Dimensions database (Digital Science &#38; Research Solutions, Inc), which covers more than 135 million publications, 6.5 million grants, and 153 million patents, providing a collaborative path to enhanced scientific discovery with transparent data sources. Importantly, cancer publications with ICRP CT–classified labels from the Dimensions database provide a way to prepare annotation data for model training.</p>
        <sec>
          <title>Construction of the Corpus and Balanced Sampling</title>
          <p>A set of 70,599 publications from 2003 to 2022 was randomly sampled from the Dimensions database using the keyword “cancer,” along with the ICPR CT labels for each publication. <xref rid="figure2" ref-type="fig">Figure 2</xref> shows the distribution of different CTs among the corpus data. Here, to intuitively demonstrate the volume distribution in the 62 different cancer categories, we ranked the categories in descending order of the number of corresponding publications included. Categories with sample sizes larger than 500 were listed separately, while the remaining 41 (66.13%) categories were grouped into 3 classes: CT22-CT35, n=14 (34.15%) categories; CT36-CT49, n=14 (34.15%); and CT50-CT62, n=13 (31.71%). The top 9 (14.52%) categories (breast cancer, non-site-specific cancer, colon and rectal cancer, lung cancer, prostate cancer, ovarian cancer, stomach cancer, cervical cancer, and pancreatic cancer) accounted for 76.35% (53,899/70,599) of the total corpus. Obviously, the distribution of labeling data was uneven, and the top 9 labels contained more than three-fourths of the total corpus. Once the original corpus was directly used to train the deep learning model without balanced sampling, the resulting classifier would cause overfitting due to a few categories with excessive volume and fail to be generalized in practical use.</p>
          <p>To avoid the degradation of precision caused by overfitting, we balanced the data sampling before model training. First, we ranked the cancer categories in descending order of the number of corresponding publications. Next, a threshold (70 in our study) used for setting the sampling index was obtained after multiple testing, followed by calculation of the index using categories with more than 70 publications. The resulting mean , median, variance, standard deviation of the number of samples contained in each category were recorded as follows: mean=1127, median=282, variance=5,889,927, and standard deviation=2427. Here, the median was selected as the initial index according to the actual distribution of sampling data. Considering that 30% of the corpus was used as the testing set, the final index was set to 500 in terms of the number of publications for a competent training set. Therefore, categories whose number of publications exceeded the final index were balanced and down-sampled separately, which means that 500 publications from each category were randomly extracted for a uniform corpus.</p>
          <p><xref ref-type="table" rid="table1">Table 1</xref> shows part of the balanced sampling results. It is clear that the optimized corpus contributed to a reduction in the adverse effects of overfitting and was subsequently used for keyword extraction and model training.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Original sample distribution of CTs. CT: cancer type.</p>
            </caption>
            <graphic xlink:href="medinform_v11i1e44892_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Example of balanced sampling of top 21 categories (N=70,599 publications).</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="140"/>
              <col width="230"/>
              <col width="100"/>
              <col width="180"/>
              <col width="170"/>
              <col width="180"/>
              <thead>
                <tr valign="top">
                  <td>Sequence number</td>
                  <td>ICRP CT<sup>a</sup></td>
                  <td>ICRP code<sup>b</sup></td>
                  <td>ICD-10<sup>c</sup> code</td>
                  <td>Original sample<sup>d</sup>, n (%)</td>
                  <td>Balanced sample<sup>e</sup>, n (%)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>1</td>
                  <td>Breast cancer</td>
                  <td>7</td>
                  <td>C50</td>
                  <td>14,103 (19.98)</td>
                  <td>500 (3.55)</td>
                </tr>
                <tr valign="top">
                  <td>2</td>
                  <td>Non-site-specific cancer</td>
                  <td>2</td>
                  <td>N/A<sup>f</sup></td>
                  <td>12,170 (17.24)</td>
                  <td>500 (4.11)</td>
                </tr>
                <tr valign="top">
                  <td>3</td>
                  <td>Colon and rectal cancer</td>
                  <td>64</td>
                  <td>C18, C19, C20</td>
                  <td>6681 (9.46)</td>
                  <td>500 (7.48)</td>
                </tr>
                <tr valign="top">
                  <td>4</td>
                  <td>Lung cancer</td>
                  <td>28</td>
                  <td>C34, C45</td>
                  <td>6190 (8.77)</td>
                  <td>500 (8.08)</td>
                </tr>
                <tr valign="top">
                  <td>5</td>
                  <td>Prostate cancer</td>
                  <td>42</td>
                  <td>C61</td>
                  <td>3890 (5.51)</td>
                  <td>500 (12.85)</td>
                </tr>
                <tr valign="top">
                  <td>6</td>
                  <td>Ovarian cancer</td>
                  <td>66</td>
                  <td>C56</td>
                  <td>3294 (4.67)</td>
                  <td>500 (15.18)</td>
                </tr>
                <tr valign="top">
                  <td>7</td>
                  <td>Stomach cancer</td>
                  <td>51</td>
                  <td>C16</td>
                  <td>2783 (3.94)</td>
                  <td>500 (17.97)</td>
                </tr>
                <tr valign="top">
                  <td>8</td>
                  <td>Cervical cancer</td>
                  <td>9</td>
                  <td>C53</td>
                  <td>2659 (3.77)</td>
                  <td>500 (18.80)</td>
                </tr>
                <tr valign="top">
                  <td>9</td>
                  <td>Pancreatic cancer</td>
                  <td>37</td>
                  <td>C25</td>
                  <td>2129 (3.02)</td>
                  <td>500 (23.49)</td>
                </tr>
                <tr valign="top">
                  <td>10</td>
                  <td>Bladder cancer</td>
                  <td>3</td>
                  <td>C67</td>
                  <td>1197 (1.70)</td>
                  <td>500 (41.77)</td>
                </tr>
                <tr valign="top">
                  <td>11</td>
                  <td>Esophageal/oesophageal cancer</td>
                  <td>12</td>
                  <td>C15</td>
                  <td>1158 (1.64)</td>
                  <td>500 (43.18)</td>
                </tr>
                <tr valign="top">
                  <td>12</td>
                  <td>Endometrial cancer</td>
                  <td>11</td>
                  <td>C54</td>
                  <td>1131 (1.60)</td>
                  <td>500 (44.21)</td>
                </tr>
                <tr valign="top">
                  <td>13</td>
                  <td>Oral cavity and lip cancer</td>
                  <td>36</td>
                  <td>C00, C01, C02, C03, C04, C05, C06, C09</td>
                  <td>965 (1.37)</td>
                  <td>500 (51.81)</td>
                </tr>
                <tr valign="top">
                  <td>14</td>
                  <td>Liver cancer</td>
                  <td>23</td>
                  <td>C22</td>
                  <td>921 (1.30)</td>
                  <td>500 (54.29)</td>
                </tr>
                <tr valign="top">
                  <td>15</td>
                  <td>Thyroid cancer</td>
                  <td>54</td>
                  <td>C73</td>
                  <td>734 (1.04)</td>
                  <td>500 (68.12)</td>
                </tr>
                <tr valign="top">
                  <td>16</td>
                  <td>Melanoma</td>
                  <td>29</td>
                  <td>C43</td>
                  <td>702 (0.99)</td>
                  <td>500 (71.23)</td>
                </tr>
                <tr valign="top">
                  <td>17</td>
                  <td>Pharyngeal cancer</td>
                  <td>61</td>
                  <td>C14.0</td>
                  <td>661 (0.94)</td>
                  <td>500 (75.64)</td>
                </tr>
                <tr valign="top">
                  <td>18</td>
                  <td>Leukemia/leukaemia</td>
                  <td>27</td>
                  <td>C91, C92, C93, C94, C95</td>
                  <td>529 (0.75)</td>
                  <td>500 (94.52)</td>
                </tr>
                <tr valign="top">
                  <td>19</td>
                  <td>Laryngeal cancer</td>
                  <td>26</td>
                  <td>C32</td>
                  <td>522 (0.74)</td>
                  <td>500 (95.79)</td>
                </tr>
                <tr valign="top">
                  <td>20</td>
                  <td>Non-Hodgkin’s lymphoma</td>
                  <td>35</td>
                  <td>C82, C83, C84, C85, C96.3</td>
                  <td>514 (0.73)</td>
                  <td>500 (97.28)</td>
                </tr>
                <tr valign="top">
                  <td>21</td>
                  <td>Head and neck cancer</td>
                  <td>21</td>
                  <td>C76.0</td>
                  <td>502 (0.71)</td>
                  <td> 500 (99.60)</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table1fn1">
                <p><sup>a</sup>ICRP CT: International Cancer Research Partnership Cancer Type; here, “ICRP CT” denotes the label.</p>
              </fn>
              <fn id="table1fn2">
                <p><sup>b</sup>“ICRP code” refers to the label code.</p>
              </fn>
              <fn id="table1fn3">
                <p><sup>c</sup>ICD-10: International Classification of Diseases, Tenth Revision; this is the ICD code linked to the appropriate ICPR CT.</p>
              </fn>
              <fn id="table1fn4">
                <p><sup>d</sup>“Original sample” represents the number of publications obtained directly from the Dimensions database.</p>
              </fn>
              <fn id="table1fn5">
                <p><sup>e</sup>“Balanced sample” means the number of publications after balanced sampling.</p>
              </fn>
              <fn id="table1fn6">
                <p><sup>f</sup>N/A: not applicable.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Construction of a Tuple Consisting of a Title and an Abstract</title>
          <p>The corpus of cancer publications consisted of titles and abstracts in English, while the title and abstract of each publication was saved separately for ease of use. Generally, the title is a short sentence of a confined length to express an independent meaning, which has a high rate of conformity regarding the content. Comparatively, an abstract is also valuable, since it clearly and accurately summarizes the main content of the publication by expressing its purpose, methods, results, and conclusions. In this study, both title and abstract were independently used to train a 2-layer classifier based on their semantic and context features, called a tuple for simplicity.</p>
        </sec>
        <sec>
          <title>Keyword Extraction From the Abstracts of Cancer Publications</title>
          <p>In this study, in contrast to the abstract layer, the operation of the title layer mainly focused on keyword training. However, the number of valid keywords contained in titles is quite limited. To improve feature representation and model performance, more keywords were extracted from the abstracts and merged with the title layer. The TextRank algorithm [<xref ref-type="bibr" rid="ref53">53</xref>] was adopted for keyword extraction from the abstracts, taking advantage of the co-occurring semantics information between words from the given sentences.</p>
          <p>A lightweight classifier was desired in this study, so the length of the abstracts needed to be controlled to keep a balance between the running speed, effectiveness, and volume occupied. To ascertain the most appropriate abstract length, we analyzed the scatter plot of the abstract length distribution, as shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>. Here, the horizontal axis represents the serial number of publications, the vertical axis represents the length of the publication abstracts, and the red (length&#62;512), green (256&#60;length≤512), blue (128&#60;length≤256), and orange (length≤128) colors represent different abstract lengths separately. Among them, the blue zone was evenly distributed and had a high proportion, the red zone had the least proportion, and the green and orange zones were comparable.</p>
          <p>After statistical analysis, the maximum length of the abstracts was set to 256 characters mainly for 3 reasons. First, 256 is the 8th power of 2, which facilitates machine understanding after tuning [<xref ref-type="bibr" rid="ref53">53</xref>]. Second, we wanted to collect the most valid information as much as possible, while reducing sparsity. Third, we wanted to avoid the learning of shallow networks, which are equivalent to follow-up layers when training (ie, gradient disappearance).</p>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Scatter plot of distribution of abstract length.</p>
            </caption>
            <graphic xlink:href="medinform_v11i1e44892_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
      <sec>
        <title>Training a Model for MLCT</title>
        <sec>
          <title>Upstream Pretrained Language Models</title>
          <p>Pretraining generally refers to putting a large amount of low-cost collected training data together, learning the commonalities of the data, and then tuning the model that has the commonalities with a small amount of labeled data of a specific domain. Therefore, pretrained language models start from the commonalities and learn the special parts of the specific task. BERT is a successful model pretrained on Wikipedia and a book corpus via self-supervision tasks, and fine-tuning benefits downstream tasks. Being a pretrained language model based on the bidirectional transformer encoder architecture, BERT uses sentence-level negative sampling to obtain sentence representation/sentence pair relationships. In addition, BERT takes advantage of the transformer model instead of LSTM for expressive and temporal efficiency, as well as the masked language model to extract contextual features. We used BERT to handle specific natural language processing tasks downstream to produce word vectors in the pretraining stage. During the fine-tuning, we then completed data training for the pretrained BERT through the output layer based on cancer publications in order to save time and improve accuracy.</p>
        </sec>
        <sec>
          <title>Downstream Classification Model Training</title>
          <p>To complete the actual task of downstream natural language processing based on the fine-tuned upstream procedure, we tried to train several preliminary language models and then chose one as the optimal model for our classifier according to its all-round performance. The “BERT + X” pattern was adopted for the classifier to determine the optimum option for X and the best way to combine BERT and X. According to the actual scenario and expert consultations, including the length, tightness of context, and multidisciplinarity, 5 models suitable for cancer publications were compared for the classification model: TextCNN, TextRNN, FastText, DPCNN, and DRNN. Eventually, the definitive combined classifier would come out dependent on the comprehensive performance analysis of these 5 models.</p>
          <p>The structure of the classification model is shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>, where the TextRNN is selected as a representation of the 5 models, for example. Here, the title and abstract were input into the title layer and the abstract layer, respectively, while the word vectors were converted by BERT and passed to the encoder layer. The word vectors output from the title and abstract layers were stitched together and then transferred to the fully connected layer for normalization, while the final output of multilabel classification was generated by the sigmoid layer with the activation function.</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Structure of the classification model. BERT: Bidirectional Encoder Representation from Transformers; TextRNN: text recurrent neural network.</p>
            </caption>
            <graphic xlink:href="medinform_v11i1e44892_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
      <sec>
        <title>Testing and Verification</title>
        <p>To evaluate the performance of the trained classifier, a subset of the testing sample was selected from the corpus, which covered all 62 classification labels defined in the ICRP CT. We applied 3 frequently used indexes, namely precision, recall, and the <italic>F</italic><sub>1</sub>-score, to verify the classification results of the 5 models. Here, the <italic>F</italic><sub>1</sub>-score is the harmonic mean of precision and recall; the larger the <italic>F</italic><sub>1</sub>-score, the better the performance of the classification model. The quantitative indexes of the 5 “BERT + X” models were compared numerically and independently to choose X.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Quantitative Analysis of the Performance of Classification Models</title>
        <p>The test results of the combined classification downstream models are shown in <xref ref-type="table" rid="table2">Table 2</xref>, where we compared performance on 3 aspects (precision, recall, <italic>F</italic><sub>1</sub>-score) of 5 classification models (BERT + TextRNN, BERT + TextCNN, BERT + FastText, BERT + DPCNN, and BERT + DRNN). All metrics of BERT + TextRNN were consistently at a high level, with a precision of 93.09%, a recall of 87.75%, and an <italic>F</italic><sub>1</sub>-score of 90.34%. Here, BERT was directly used for fine-tuning training, combined with the TextRNN for multilabel classification. After adjusting and testing the parameters several times, the best parameters were obtained and are shown in <xref ref-type="table" rid="table3">Table 3</xref>.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Performance comparison of 5 different “BERT<sup>a</sup> + X” models.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="300"/>
            <col width="260"/>
            <col width="200"/>
            <col width="240"/>
            <thead>
              <tr valign="top">
                <td>Model</td>
                <td>Precision (%)</td>
                <td>Recall (%)</td>
                <td><italic>F</italic><sub>1</sub>-score (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>BERT + TextRNN<sup>b</sup></td>
                <td>93.09</td>
                <td>87.75</td>
                <td>90.34</td>
              </tr>
              <tr valign="top">
                <td>BERT + TextCNN<sup>c</sup></td>
                <td>84.19</td>
                <td>79.69</td>
                <td>81.88</td>
              </tr>
              <tr valign="top">
                <td>BERT + FastText</td>
                <td>93.05</td>
                <td>75.73</td>
                <td>83.50</td>
              </tr>
              <tr valign="top">
                <td>BERT + DPCNN<sup>d</sup></td>
                <td>81.78</td>
                <td>75.00</td>
                <td>78.25</td>
              </tr>
              <tr valign="top">
                <td>BERT + DRNN<sup>e</sup></td>
                <td>88.98</td>
                <td>53.05</td>
                <td> 66.47</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>BERT: Bidirectional Encoder Representation from Transformers.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>TextRNN: text recurrent neural network.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>TextCNN: text convolutional neural network.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>DPCNN: deep pyramid convolutional neural network.</p>
            </fn>
            <fn id="table2fn5">
              <p><sup>e</sup>DRNN: deep recurrent neural network.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Parameters of the optimal “BERT<sup>a</sup> + TextRNN<sup>b</sup>” model.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="430"/>
            <col width="570"/>
            <thead>
              <tr valign="top">
                <td>Parameter</td>
                <td>Value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Num_ train_ epochs</td>
                <td>200.0</td>
              </tr>
              <tr valign="top">
                <td>Max_ seq_ length</td>
                <td>256</td>
              </tr>
              <tr valign="top">
                <td>leaning_ rate</td>
                <td>0.0001</td>
              </tr>
              <tr valign="top">
                <td>train_ batch_ size</td>
                <td>32</td>
              </tr>
              <tr valign="top">
                <td>Predict_ batch_ size</td>
                <td>32</td>
              </tr>
              <tr valign="top">
                <td>Drop</td>
                <td>0.5</td>
              </tr>
              <tr valign="top">
                <td>Dense1</td>
                <td>256</td>
              </tr>
              <tr valign="top">
                <td>Dense2</td>
                <td>62</td>
              </tr>
              <tr valign="top">
                <td>TextRNN</td>
                <td>256×2</td>
              </tr>
              <tr valign="top">
                <td>LTSM<sup>c</sup>_UNITS</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>BERT_OUTDIM</td>
                <td>768</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>BERT: Bidirectional Encoder Representation from Transformers.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>TextRNN: text recurrent neural network.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>LSTM: long short-term memory.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Supplementary Analysis of the Model Structure</title>
        <p>The proposed classification model takes the title and abstract of a publication as independent input, namely a tuple, as mentioned in the “Methods” section. To verify the effectiveness of the tuple input of the trained model, we conducted a set of comparison experiments based on “BERT + TextRNN.” Especially, “2 tuples and 2 levels” represents the model that took the title and abstract as 2 levels of the training model separately, “1 unit and 1 level” represents the model that combined the title and abstract as whole-text input for training, and “the title alone” and “the abstract alone” represent the models that took the title or the abstract alone as input, respectively. <xref ref-type="table" rid="table4">Table 4</xref> records the performance of different models from supplementary experiments, where the “2 tuples and 2 levels” model was superior, with a precision of 93.09%, a recall of 87.75%, and an <italic>F</italic><sub>1</sub>-score of 90.34%. The reason is that when applying the title or abstract alone to train the classification model, feature reduction occurs, which further leads to inferior performance of classification. In addition, compared with the “1 unit and 1 level” model taking the title and abstract as a 1-part text input, the “tuple and 2 levels” model enhanced the specificity of feature extraction. Notice that the title and abstract make different contributions to the subject of publication, and the classification model will lose the sufficient feature of the abstract if it is not trained separately. Eventually, the classification of the tuple input was elected for the proposed classification model. This is also identical to most of the subject-based literature processing, which take the title and abstract as independent text, such as subject indexing.</p>
        <p>In addition, the proposed classification model used the TextRank algorithm to extract keywords from the abstract and supplement the title layer with them. To demonstrate the necessity and effectiveness of this step, <xref rid="figure5" ref-type="fig">Figure 5</xref> shows the numerical indexes of the classification model with and without keyword extraction and supplementation. Here, the performance of the model with TextRank keyword extraction is shown in blue, and the results with direct training using titles and abstracts separately are plotted in green. It is obvious that the model without keyword supplementation had a lower performance in recall, precision, and the <italic>F</italic><sub>1</sub>-score, which confirms the efficiency and effectiveness of the proposed classification model from a different perspective.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Comparison of different types of input.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="350"/>
            <col width="240"/>
            <col width="190"/>
            <col width="220"/>
            <thead>
              <tr valign="top">
                <td>Input</td>
                <td>Precision (%)</td>
                <td>Recall (%)</td>
                <td><italic>F</italic><sub>1</sub>-score (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>2 tuples and 2 levels</td>
                <td>93.09</td>
                <td>87.75</td>
                <td>90.34</td>
              </tr>
              <tr valign="top">
                <td>1 unit and 1 level</td>
                <td>82.32</td>
                <td>79.78</td>
                <td>81.04</td>
              </tr>
              <tr valign="top">
                <td>The title alone</td>
                <td>44.37</td>
                <td>31.54</td>
                <td>36.88</td>
              </tr>
              <tr valign="top">
                <td>The abstract alone</td>
                <td>85.50</td>
                <td>79.79</td>
                <td> 82.55</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Comparison of the model with and without keyword supplementation.</p>
          </caption>
          <graphic xlink:href="medinform_v11i1e44892_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Comprehensive Analysis of the Multilabel Classification</title>
        <p>To explore whether there was a particular regularity in the distribution of multiple labels among different categories, the proportion of multilabel publications was statistically analyzed for classifier training. In total, 15,296 (21.67%) of the 70,599 publications had 2 or more labels, that is, more than one-fifth of the publications were multilabel ones. In addition, the categories were counted based on the characteristics of the number of labels (<xref rid="figure6" ref-type="fig">Figure 6</xref>) to visualize multilabel distributions. Here, we listed the top 20 categories by the volume of the publications included. The blue color refers to the total number of samples collected under a specific category, the green color is the number of samples with multiple labels under that category, and the yellow color denotes those with at least 3 labels. The categories with fewer samples had a higher ratio of multiple labels, and multiple labels had different characteristics among different categories. Analysis for a deeper relationship between multiple labels is necessary.</p>
        <p>There are principally 2 roles of comprehensive analysis of multilabel publications. First, it highlighted the process of balanced sampling. Since part of the publications belonged to multiple categories and some of the categories had a high co-occurrence frequency compared to other categories, direct model training on the original corpus would lead to overfitting due to uneven distribution of samples. This is why we selected multilabel papers instead of those with a single label in order to obtain a balanced sample for classifier training. Second, the multilabel publications revealed the potential semantic correlation of texts, which provided a direction for the analysis of data characteristics. Based on the co-occurrence correlation and distribution between different categories, the semantic features were further characterized and the proposed classification model extended to other data with the same characteristics.</p>
        <p>To explore the inherent correlation between multiple labels, we selected 2500 multilabel publications from the corpus for characteristics analysis. Specifically, samples with 2 labels accounted for 59.04% (1476/2500) and samples with at least 3 labels accounted for 40.96% (1024/2500) of all publications. <xref ref-type="table" rid="table5">Table 5</xref> lists part of the analysis results. For instance, different CTs often co-occurred for statistical surveys in the literature review with a weak association.</p>
        <p>The correlation strength of multiple labels of cancer publications were independently reviewed and assessed by 3 biocurators with relevant knowledge. Concretely, a publication with 2 labels and a clear semantic correlation within the corresponding subject classification labels was interpreted as “1,” while a publication with 3 or more labels and more than two-third of the labels holding an obvious semantic association were also considered as “1”. Once the 2 biocurators reached the same results, that specific publication was passed into the “review completed” data set. When they had different opinions, the corresponding publication was annotated as “pending review.” After the first round of reviewing, the “pending review” data set was discussed together for the second time, and a third biocurator was invited for confirmation and agreement.</p>
        <p><xref rid="figure7" ref-type="fig">Figure 7</xref> shows specific numbers of labeled publications with interlabel correlation, where the “strong association” zone consists of publications whose co-occurrence labels had explicit links between semantics, the “low association” zone consists of publications whose co-occurrence labels did not have clearly semantic links, and the “independent examples” zone consists of publications whose cancer labels were taken as single entities or independent examples for observation without intrinsic correlations. Of the 1476 publications with 2 labels, 1201 (81.37%) had a strong association, while 572/1024 (55.86%) publications with at least 3 labels had a low association. Among the publications with lowly correlated labels, 718/1024 (70.12%) took the different categories of cancers as a single entity or independent examples for observation without intrinsic correlations. We noticed some possible influence on the association distributions for training. In addition, the relationship between 2 labels in a publication was stronger than that among 3 or more labels, which justifies the demand to classify publications by subject at the publication level. Therefore, the strength of interlabel association could achieve the effect of assisting decision-making after multilabel classification to further support clinical diagnosis and treatment. In the future, we will carry out knowledge mining based on the existing interlabel semantic network and strengthen the training of interlabel association to improve the performance of the proposed classification model.</p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Comparison of samples with multilabels.</p>
          </caption>
          <graphic xlink:href="medinform_v11i1e44892_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Examples of data evaluated by experts.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="100"/>
            <col width="700"/>
            <col width="100"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td>Sequence number</td>
                <td>Title</td>
                <td>Labels, n</td>
                <td>Correlation strength<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>Temporal Trends of Subsequent Breast Cancer Among Women With Ovarian Cancer: A Population-Based Study [<xref ref-type="bibr" rid="ref54">54</xref>]</td>
                <td>2</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>Clinical Characteristics and Survival Outcomes of Patients With Both Primary Breast Cancer and Primary Ovarian Cancer [<xref ref-type="bibr" rid="ref55">55</xref>]</td>
                <td>2</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>Secondary Malignancies in Long-Term Ovarian Cancer Survivors: Results of the “Carolin Meets HANNA” Study [<xref ref-type="bibr" rid="ref56">56</xref>]</td>
                <td>2</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>Trends in Participation Rates of the National Cancer Screening Program among Cancer Survivors in Korea [<xref ref-type="bibr" rid="ref57">57</xref>]</td>
                <td>3</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>Increasing Trends in the Prevalence of Prior Cancer in Newly Diagnosed Lung, Stomach, Colorectal, Breast, Cervical, and Corpus Uterine Cancer Patients: A Population-Based Study [<xref ref-type="bibr" rid="ref58">58</xref>]</td>
                <td>4</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>Cancer Registration in China and Its Role in Cancer Prevention and Control [<xref ref-type="bibr" rid="ref59">59</xref>]</td>
                <td>3</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>Cancer Incidence, Mortality, and Burden in China: A Time‐Trend Analysis and Comparison With the United States and United Kingdom Based on the Global Epidemiological Data Released in 2020 [<xref ref-type="bibr" rid="ref60">60</xref>]</td>
                <td>5</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>8</td>
                <td>Excess Costs and Economic Burden of Obesity-Related Cancers in the United States [<xref ref-type="bibr" rid="ref61">61</xref>]</td>
                <td>3</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>9</td>
                <td>Cancer Attributable to Human Papillomavirus Infection in China: Burden and Trends [<xref ref-type="bibr" rid="ref62">62</xref>]</td>
                <td>4</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>10</td>
                <td>Excess Costs and Economic Burden of Obesity-Related Cancers in the United States [<xref ref-type="bibr" rid="ref63">63</xref>]</td>
                <td>3</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>11</td>
                <td>Cancer Awareness in the General Population varies With Sex, Age and Media Coverage: A Population-Based Survey With Focus on Gynecologic Cancers [<xref ref-type="bibr" rid="ref64">64</xref>]</td>
                <td>5</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>12</td>
                <td>Public Attitudes Towards Cancer Survivors Among Korean Adults [<xref ref-type="bibr" rid="ref65">65</xref>]</td>
                <td>3</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>13</td>
                <td>Importance of Hospital Cancer Registries in Africa [<xref ref-type="bibr" rid="ref66">66</xref>]</td>
                <td>2</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>14</td>
                <td>Correlation Between Family History and Characteristics of Breast Cancer [<xref ref-type="bibr" rid="ref67">67</xref>]</td>
                <td>2</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>15</td>
                <td>Familial Aggregation of Early‐Onset Cancers [<xref ref-type="bibr" rid="ref68">68</xref>]</td>
                <td>3</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>16</td>
                <td>Trends in Regional Cancer Mortality in Taiwan 1992–2014 [<xref ref-type="bibr" rid="ref69">69</xref>]</td>
                <td>6</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>17</td>
                <td>Statin Use and Incidence and Mortality of Breast and Gynecology Cancer: A Cohort Study Using the National Health Insurance Claims database [<xref ref-type="bibr" rid="ref70">70</xref>]</td>
                <td>4</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>18</td>
                <td>Management of Breast Cancer Risk in BRCA1/2 Mutation Carriers Who Are Unaffected With Cancer [<xref ref-type="bibr" rid="ref71">71</xref>]</td>
                <td>2</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>19</td>
                <td>Association Between Diabetes, Obesity, Aging, and Cancer: Review of Recent Literature [<xref ref-type="bibr" rid="ref72">72</xref>]</td>
                <td>4</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>20</td>
                <td>The European Cancer Burden in 2020: Incidence and Mortality Estimates for 40 Countries and 25 Major Cancers [<xref ref-type="bibr" rid="ref73">73</xref>]</td>
                <td>3</td>
                <td> 0</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>In the last column, “1” refers to a strong correlation, which means 2 labels of a given publication are semantically or syntactically linked to each other, such as relaying, concurrency, and coupling effects. Conversely, “0” indicates a weak association between multiple labels of a specific publication, and there is no obvious semantic or syntactic correlation.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Relational mapping of multilabel publication distributions.</p>
          </caption>
          <graphic xlink:href="medinform_v11i1e44892_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>There are several reasons for the “BERT + TextRNN” model to show optimal performance in cancer publication classification. First, cancer publications usually consist of long texts (eg, titles and abstracts) containing specialty terms and intensive contextual semantic correlations, which are quite suitable for the TextRNN model, which is good at processing sequential information with strong correlation and a high degree of uniformity. Moreover, comprehensive analysis of multilabel classification reflects that cancer publications are characterized by a high multilabel rate in areas with low research intensity due to the interdisciplinary and cooperative working, which enhances the contextual correlation to a certain extent. The “BERT + TextRNN” model is more likely to be efficient in such fields because it can effectively capture contextual semantics.</p>
        <p>Compared with the TextRNN, the other models were insufficient and could be further improvement. The TextCNN might not be able to capture sufficient features, since it is not highly interpretable and well suited to address the fixed-length horizon issue. Although the DRNN is an enhanced version of the RNN with low computational speed, it fails to consider any upcoming input to the current state. Therefore, the DRNN is much less effective than the TextRNN. Being a long-linear model, FastText hardly handles the recognition of the long text of cancer publications and needs further optimization due to a limited recall rate.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>The proposed classifier based on the “BERT + TextRNN” model has 2 issues. On the one hand, the performance of the classifier may be reduced due to the accumulation of errors caused by keyword extraction, which will be enhanced by adjusting the model parameters and adding a self-testing function. On the other hand, the tuple input of titles and abstracts was integrated to train the multilabel classifier, which proved to be better than the input of titles or abstracts alone. Therefore, cancer publications with both title and abstract are desired for the proposed classifier. However, for the few cancer publications papers without abstracts, the classifier we trained will still be usable and has a slight performance cost.</p>
      </sec>
      <sec>
        <title>Major Applications of the Proposed Classifier</title>
        <p>We trained a classifier based on the “BERT + TextRNN” model for classifying the cancer literature at the publication level, which could directly assign multiple labels to each publication. The proposed classifier has at least 2 major applications. First, the desired model can achieve efficient and effective multilabel classification of cancer publications more granularly, not only for cancer publications in English, but also for full-text literature in other language whose titles and abstracts have English versions. Since the trained classifier is based on cancer publications with titles and abstracts, it should be suitable for any papers whose titles and abstracts are written in English (eg, Chinese medical publications). Another significant application is the fine-grained classification of scientific data on cancer research. Given that valuable data are accompanied by a brief description in English, the proposed model will classify them into the groups with appropriate CTs. Therefore, a content-based label in terms of CTs will be assigned to scientific data and literature, which provides a way to construct a full spectrum of data foundation for precision medicine.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>Given that existing classification methods are at the journal level and there is an urgent need for subject classification due to the proliferation of cancer research, a multilabel classifier was trained based on deep learning models, specifically “BERT + TextRNN.” Moreover, the proposed high-resolution classification model was evaluated as being efficient and effective for cancer publications in terms of quantitative comparison and feature analysis.</p>
        <p>The innovative exploration in this study is as follows:</p>
        <list list-type="bullet">
          <list-item>
            <p>The “BERT + TextRNN” classification model was trained for classifying cancer literature at the publication level, which shows promise in automatically assigning each publication at least 1 label to which it belongs.</p>
          </list-item>
          <list-item>
            <p>The proposed model achieves high-quality multilabel classification at the publication level, which could reflect the features of cancer publications more accurately with multiple labels compared to the existing method that annotates papers with a single label at the journal level.</p>
          </list-item>
          <list-item>
            <p>By comprehensive analysis of the correlation between multiple labels, as well as the data characteristics of multilabel cancer publications, the proposed model was verified to be suitable for the literature with features such as high specialization, uniform entity nouns, and standardized long texts.</p>
          </list-item>
        </list>
        <p>In the future, the classification model will be extended to classify medical literature on cardiovascular disease and diabetes, where a great number of highly specialized publications have accumulated and are attracting increasing research attention, in order to improve health conditions worldwide.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">BERT</term>
          <def>
            <p>Bidirectional Encoder Representation from Transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CNN</term>
          <def>
            <p>convolutional neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CT</term>
          <def>
            <p>cancer type</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">DPCNN</term>
          <def>
            <p>deep pyramid convolutional neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">DRNN</term>
          <def>
            <p>deep recurrent neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">ICD</term>
          <def>
            <p>International Classification of Diseases</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">ICD-10</term>
          <def>
            <p>International Classification of Diseases, Tenth Revision</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">ICRP CT</term>
          <def>
            <p>International Cancer Research Partnership Cancer Type</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">LSTM</term>
          <def>
            <p>long short-term memory</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">MLC</term>
          <def>
            <p>multilabel classification</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">MLTC</term>
          <def>
            <p>multilabel text classification</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">RNN</term>
          <def>
            <p>recurrent neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">TextRNN</term>
          <def>
            <p>text recurrent neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">TextCNN</term>
          <def>
            <p>text convolutional neural network</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
  <p>This work was supported by the Innovation Fund for Medical Sciences of Chinese Academy of Medical Sciences (grant: 2021-I2M-1-033) and the Fundamental Research Funds for the Central Universities (grant:3332023163).</p>
</ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ferlay</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ervik</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Colombet</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mery</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Piñeros</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Cancer today: data visualization tools for exploring the global cancer burden in 2020</article-title>
          <source>International Agency for Research on Cancer</source>
          <year>2020</year>
          <access-date>2023-09-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://gco.iarc.fr/today,">https://gco.iarc.fr/today,</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Becher</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>The significance of disciplinary differences</article-title>
          <source>Stud Higher Educ</source>
          <year>1994</year>
          <month>01</month>
          <volume>19</volume>
          <issue>2</issue>
          <fpage>151</fpage>
          <lpage>161</lpage>
          <pub-id pub-id-type="doi">10.1080/03075079412331382007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bensaude-Vincent</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Discipline-building in synthetic biology</article-title>
          <source>Stud Hist Philos Biol Biomed Sci</source>
          <year>2013</year>
          <month>06</month>
          <volume>44</volume>
          <issue>2</issue>
          <fpage>122</fpage>
          <lpage>129</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://core.ac.uk/reader/52817072?utm_source=linkout"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.shpsc.2013.03.007</pub-id>
          <pub-id pub-id-type="medline">23566941</pub-id>
          <pub-id pub-id-type="pii">S1369-8486(13)00021-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Minaee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kalchbrenner</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Cambria</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Nikzad</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chenaghlu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Deep learning-based text classification: a comprehensive review</article-title>
          <source>ACM Comput Surv</source>
          <year>2021</year>
          <month>04</month>
          <day>17</day>
          <volume>54</volume>
          <issue>3</issue>
          <fpage>1</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1145/3439726</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Henao</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Carin</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Joint embedding of words and labels for text classification</article-title>
          <year>2018</year>
          <conf-name>56th Annual Meeting of the Association for Computational Linguistics</conf-name>
          <conf-date>July 15-20, 2018</conf-date>
          <conf-loc>Melbourne, Australia</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/P18-1216</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Conneau</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schwenk</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Barrault</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lecun</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Very deep convolutional networks for text classification</article-title>
          <year>2017</year>
          <conf-name>15th Conference of the European Chapter of the Association for Computational Linguistics</conf-name>
          <conf-date>April 2017</conf-date>
          <conf-loc>Valencia, Spain</conf-loc>
          <fpage>1107</fpage>
          <lpage>1116</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/e17-1104</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Automatic discipline classification for scientific papers based on a deep pre-training language model</article-title>
          <source>J China Soc Sci Tech Inf</source>
          <year>2020</year>
          <volume>39</volume>
          <issue>10</issue>
          <fpage>1046</fpage>
          <lpage>1059</lpage>
          <pub-id pub-id-type="doi">10.1117/12.2311282</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
          <article-title>CSSC category to Web of Science category mapping 2012</article-title>
          <source>Clarivate Analytics</source>
          <access-date>2023-09-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://incites.help.clarivate.com/Content/Research%20Areas/china-scadc-subject-categories.htm">http://incites.help.clarivate.com/Con tent/Research%20Areas/china-scadc-subject-categories.htm</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jia</surname>
              <given-names>YX</given-names>
            </name>
          </person-group>
          <article-title>International influence evaluation on disciplines of universities in Shanghai: a bibliometric analysis based on InCites database</article-title>
          <source>Fudan Education Forum</source>
          <year>2014</year>
          <volume>12</volume>
          <issue>4</issue>
          <fpage>29</fpage>
          <lpage>34</lpage>
          <pub-id pub-id-type="doi">10.13397/j.cnki.fef.2014.04.006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Classifying research articles in multidisciplinary sciences journals into subject categories</article-title>
          <source>KO</source>
          <year>2015</year>
          <volume>42</volume>
          <issue>3</issue>
          <fpage>139</fpage>
          <lpage>153</lpage>
          <pub-id pub-id-type="doi">10.5771/0943-7444-2015-3-139</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Taheriyan</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Subject classification of research papers based on interrelationships analysis</article-title>
          <year>2011</year>
          <conf-name>KDMS 2011: Workshop on Knowledge Discovery, Modeling and Simulation</conf-name>
          <conf-date>August 21-24, 2011</conf-date>
          <conf-loc>San Diego, CA</conf-loc>
          <fpage>39</fpage>
          <lpage>44</lpage>
          <pub-id pub-id-type="doi">10.1145/2023568.2023579</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>An interdisciplinary literature classifier based on multi-task multi-label learning</article-title>
          <year>2021</year>
          <conf-name>2021 International Conference on Asian Language Processing (IALP)</conf-name>
          <conf-date>December 11-13, 2021</conf-date>
          <conf-loc>Singapore</conf-loc>
          <pub-id pub-id-type="doi">10.1109/ialp54817.2021.9675234</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Analysis on the evolution trend and characteristics of multidisciplinary oncology team</article-title>
          <source>Shanxi Medical University</source>
          <year>2021</year>
          <access-date>2023-09-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://kns.cnki.net/kcms/detail/detail.aspx?doi=10.27288/d.cnki.gsxyu.2021.000023&#38;dbcode=CDFD">http://kns.cnki.net/kcms/detail/detail.aspx?doi=10.27288/d.cnki.gsxyu.2021.000023&#38;dbcode=CDFD</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lyu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Cancer research driven by cutting-edge multi-disciplinary technologies</article-title>
          <source>Chin Sci Bull</source>
          <year>2020</year>
          <month>7</month>
          <day>1</day>
          <volume>65</volume>
          <issue>31</issue>
          <fpage>3446</fpage>
          <lpage>3460</lpage>
          <pub-id pub-id-type="doi">10.1360/tb-2020-0638</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Research progress of text classification technology based on deep learning</article-title>
          <source>Comput Eng</source>
          <year>2021</year>
          <volume>47</volume>
          <issue>02</issue>
          <fpage>1</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.19678/j.issn.1000-3428.0059099</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maron</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Automatic indexing: an experimental inquiry</article-title>
          <source>ACM</source>
          <year>1961</year>
          <month>07</month>
          <volume>8</volume>
          <issue>3</issue>
          <fpage>404</fpage>
          <lpage>417</lpage>
          <pub-id pub-id-type="doi">10.1145/321075.321084</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Phung</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rana</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Karmakar</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Shilton</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yearwood</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dimitrova</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>TB</given-names>
            </name>
            <name name-style="western">
              <surname>Venkatesh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Berk</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Guidelines for developing and reporting machine learning predictive models in biomedical research: a multidisciplinary view</article-title>
          <source>J Med Internet Res</source>
          <year>2016</year>
          <month>12</month>
          <day>16</day>
          <volume>18</volume>
          <issue>12</issue>
          <fpage>e323</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2016/12/e323/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.5870</pub-id>
          <pub-id pub-id-type="medline">27986644</pub-id>
          <pub-id pub-id-type="pii">v18i12e323</pub-id>
          <pub-id pub-id-type="pmcid">PMC5238707</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Joachims</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Text category with support vector machines: learning with many relevant features</article-title>
          <year>1998</year>
          <conf-name>ECML 1998: 10th European Conference on Machine Learning</conf-name>
          <conf-date>April 21-23, 1998</conf-date>
          <conf-loc>Chemnitz, Germany</conf-loc>
          <fpage>137</fpage>
          <lpage>142</lpage>
          <pub-id pub-id-type="doi">10.1007/bfb0026683</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rasjid</surname>
              <given-names>ZE</given-names>
            </name>
            <name name-style="western">
              <surname>Setiawan</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Performance comparison and optimization of text document classification using k-NN and naïve Bayes classification techniques</article-title>
          <source>Procedia Comput Sci</source>
          <year>2017</year>
          <volume>116</volume>
          <fpage>107</fpage>
          <lpage>112</lpage>
          <pub-id pub-id-type="doi">10.1016/j.procs.2017.10.017</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tokuda</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Nagai</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A new differential LSI space-based probabilistic document classifier</article-title>
          <source>Inf Process Lett</source>
          <year>2003</year>
          <month>12</month>
          <volume>88</volume>
          <issue>5</issue>
          <fpage>203</fpage>
          <lpage>212</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ipl.2003.09.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pennington</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Socher</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>CD</given-names>
            </name>
          </person-group>
          <article-title>GloVe: global vectors for word representation</article-title>
          <year>2014</year>
          <conf-name>2014 Conference on Empirical Methods in Natural Language Processing (EMNLP)</conf-name>
          <conf-date>October 2014</conf-date>
          <conf-loc>Doha, Qatar</conf-loc>
          <pub-id pub-id-type="doi">10.3115/v1/d14-1162</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Efficient estimation of word representations in vector space</article-title>
          <source>arXiv:1301.3781v3 [cs.CL] </source>
          <comment>Preprint posted online January 16, 2013.</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.1301.3781"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1301.3781</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Siwei</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Word and document embeddings based on neural network approaches</article-title>
          <source>arXiv:1611.05962v1 [cs.CL]</source>
          <comment>Preprint posted online November 18, 2016.</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.1611.05962"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1611.05962</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Recurrent convolutional neural networks for text classification</article-title>
          <year>2015</year>
          <conf-name>AAAI'15: Twenty-Ninth AAAI Conference on Artificial Intelligence</conf-name>
          <conf-date>January 25-30, 2015</conf-date>
          <conf-loc>Austin, TX</conf-loc>
          <pub-id pub-id-type="doi">10.1609/aaai.v29i1.9513</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kalchbrenner</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Grefenstette</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Blunsom</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>A convolutional neural network for modelling sentences</article-title>
          <year>2014</year>
          <conf-name>52nd Annual Meeting of the Association for Computational Linguistics</conf-name>
          <conf-date>June 22-27, 2014</conf-date>
          <conf-loc>Baltimore, MD</conf-loc>
          <pub-id pub-id-type="doi">10.3115/v1/p14-1062</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Convolutional neural networks for sentence classificationC</article-title>
          <year>2014</year>
          <conf-name>2014 Conference on Empirical Methods in Natural Language Processing (EMNLP)</conf-name>
          <conf-date>October 2014</conf-date>
          <conf-loc>Doha, Qatar</conf-loc>
          <fpage>1746</fpage>
          <lpage>1751</lpage>
          <pub-id pub-id-type="doi">10.3115/v1/d14-1181</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Lecun</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Character-level convolutional networks for text classificationC</article-title>
          <year>2015</year>
          <conf-name>28th International Conference on Neural Information Processing Systems</conf-name>
          <conf-date>December 7-12, 2015</conf-date>
          <conf-loc>Montreal Canada</conf-loc>
          <fpage>649</fpage>
          <lpage>657</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Joulin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Grave</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bojanowski</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Bag of tricks for efficient text classification</article-title>
          <year>2017</year>
          <conf-name>EACL 2017: 15th Conference of the European Chapter of the Association for Computational Linguistics</conf-name>
          <conf-date>April 3-7, 2017</conf-date>
          <conf-loc>Valencia, Spain</conf-loc>
          <fpage>427</fpage>
          <lpage>431</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/e17-2068</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Oh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Learning transferrable knowledge for semantic segmentation with deep convolutional neural network</article-title>
          <year>2016</year>
          <conf-name>2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)</conf-name>
          <conf-date>June 26-July 1, 2016</conf-date>
          <conf-loc>Las Vegas, NV</conf-loc>
          <fpage>3204</fpage>
          <lpage>3212</lpage>
          <pub-id pub-id-type="doi">10.1109/cvpr.2016.349</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Deep pyramid convolutional neural networks for text categorization</article-title>
          <year>2017</year>
          <conf-name>55th Annual Meeting of the Association for Computational Linguistics</conf-name>
          <conf-date>July 2017</conf-date>
          <conf-loc>Vancouver, Canada</conf-loc>
          <fpage>562</fpage>
          <lpage>570</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/p17-1052</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Efficient character-level document classification by combining convolution and recurrent layers</article-title>
          <source>arXiv:1602.00367v1 [cs.CL]</source>
          <comment>Preprint posted online February 1, 2016.</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.1602.00367"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1602.00367</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bahdanau</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bengio</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Neural machine translation by jointly learning to align and translate</article-title>
          <source>arXiv:1409.0473v7 [cs.CL] </source>
          <comment>Preprint posted online September 1, 2014. </comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.1409.0473"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1409.0473</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>van Merrienboer</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gulcehre</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bougares</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Schwenk</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Bengio</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Learning phrase representations using RNN encoder-decoder for statistical machine translation</article-title>
          <source>arXiv:1406.1078v3 [cs.CL] </source>
          <comment>Preprint posted online June 3, 2014.</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.1406.1078"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1406.1078</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hermann</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kočiský</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Grefenstette</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Espeholt</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kay</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Suleyman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Blunsom</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Teaching machines to read and comprehend</article-title>
          <source>arXiv:1506.03340v3 [cs.CL] </source>
          <comment>Preprint posted online June 10, 2015.</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.1506.03340"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1506.03340</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Dyer</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Smola</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hovy</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Hierarchical attention networks for document classification</article-title>
          <year>2016</year>
          <conf-name>2016 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</conf-name>
          <conf-date>June 2016</conf-date>
          <conf-loc>San Diego, CA</conf-loc>
          <fpage>1480</fpage>
          <lpage>1489</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/n16-1174</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lili</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jing</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>A study on the automatic classification of chinese literature in periodicals based on BERT model</article-title>
          <source>Library J</source>
          <year>2022</year>
          <volume>41</volume>
          <issue>05</issue>
          <fpage>135</fpage>
          <lpage>118+135</lpage>
          <pub-id pub-id-type="doi">10.13663/j.cnki.lj.2022.05.014</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xiaolei</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bin</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>BERT-CNN: a hierarchical patent classifier based on pre-trained language model</article-title>
          <source>arXiv:1911.06241v1 [cs.CL] </source>
          <comment>Preprint posted online November 3, 2019.</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.1911.06241"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1911.06241</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Study on the discipline classification of massive humanities and social science academic literature driven by deep learning</article-title>
          <source>Inf Stud Theory Appl</source>
          <year>2020</year>
          <month>10</month>
          <day>20</day>
          <fpage>71</fpage>
          <lpage>81</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://kns.cnki.net/kcms/detail/11.1762.G3.20220823.1138.004.html"/>
          </comment>
          <pub-id pub-id-type="doi">10.16353/j.cnki.1000-7490.2023.02.009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yoon</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>So</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>BioBERT: a pre-trained biomedical language representation model for biomedical text mining</article-title>
          <source>Bioinformatics</source>
          <year>2020</year>
          <month>02</month>
          <day>15</day>
          <volume>36</volume>
          <issue>4</issue>
          <fpage>1234</fpage>
          <lpage>1240</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31501885"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btz682</pub-id>
          <pub-id pub-id-type="medline">31501885</pub-id>
          <pub-id pub-id-type="pii">5566506</pub-id>
          <pub-id pub-id-type="pmcid">PMC7703786</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tinn</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lucas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Usuyama</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Naumann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Poon</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Domain-specific language model pretraining for biomedical natural language processing</article-title>
          <source>ACM Trans Comput Healthc</source>
          <year>2021</year>
          <month>10</month>
          <day>15</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>23</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1145/3458754"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3458754</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mitra</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rawat</surname>
              <given-names>BPS</given-names>
            </name>
            <name name-style="western">
              <surname>McManus</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Relation classification for bleeding events from electronic health records using deep learning systems: an empirical study</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>07</month>
          <day>02</day>
          <volume>9</volume>
          <issue>7</issue>
          <fpage>e27527</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/7/e27527/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/27527</pub-id>
          <pub-id pub-id-type="medline">34255697</pub-id>
          <pub-id pub-id-type="pii">v9i7e27527</pub-id>
          <pub-id pub-id-type="pmcid">PMC8285744</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Rawat</surname>
              <given-names>BPS</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Fine-tuning Bidirectional Encoder Representations From Transformers (BERT)–based models on large-scale electronic health record notes: an empirical study</article-title>
          <source>JMIR Med Inform</source>
          <year>2019</year>
          <month>09</month>
          <day>12</day>
          <volume>7</volume>
          <issue>3</issue>
          <fpage>e14830</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2019/3/e14830/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/14830</pub-id>
          <pub-id pub-id-type="medline">31516126</pub-id>
          <pub-id pub-id-type="pii">v7i3e14830</pub-id>
          <pub-id pub-id-type="pmcid">PMC6746103</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Automatic ICD-10 coding and training system: deep neural network based on supervised learning</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>08</month>
          <day>31</day>
          <volume>9</volume>
          <issue>8</issue>
          <fpage>e23230</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/8/e23230/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/23230</pub-id>
          <pub-id pub-id-type="medline">34463639</pub-id>
          <pub-id pub-id-type="pii">v9i8e23230</pub-id>
          <pub-id pub-id-type="pmcid">PMC8441604</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hung</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Automatic International Classification of Diseases coding system: deep contextualized language model with rule-based approaches</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <month>06</month>
          <day>29</day>
          <volume>10</volume>
          <issue>6</issue>
          <fpage>e37557</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/6/e37557/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/37557</pub-id>
          <pub-id pub-id-type="medline">35767353</pub-id>
          <pub-id pub-id-type="pii">v10i6e37557</pub-id>
          <pub-id pub-id-type="pmcid">PMC9282222</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zan</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Joint binary neural network for multi-label learning with applications to emotion classification</article-title>
          <source>Natural Language Processing and Chinese Computing. NLPCC 2018. Lecture Notes in Computer Science, Vol 11108</source>
          <year>2018</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Du</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>ML-Net: multi-label classification of biomedical texts with deep neural networks</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2019</year>
          <month>11</month>
          <day>01</day>
          <volume>26</volume>
          <issue>11</issue>
          <fpage>1279</fpage>
          <lpage>1285</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31233120"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz085</pub-id>
          <pub-id pub-id-type="medline">31233120</pub-id>
          <pub-id pub-id-type="pii">5522430</pub-id>
          <pub-id pub-id-type="pmcid">PMC7647240</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Glinka</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Woźniak</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zakrzewska</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Multi-label medical text classification by feature selection</article-title>
          <year>2017</year>
          <conf-name>IEEE 26th International Conference on Enabling Technologies: Infrastructure for Collaborative Enterprises (WETICE)</conf-name>
          <conf-date>June 21-23, 2017</conf-date>
          <conf-loc>Poznan, Poland</conf-loc>
          <fpage>176</fpage>
          <lpage>181</lpage>
          <pub-id pub-id-type="doi">10.1109/wetice.2017.42</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hughes</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Kotoulas</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Suzumura</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Medical text classification using convolutional neural networks</article-title>
          <source>arXiv:1704.06841v1 [cs.CL]</source>
          <comment>Preprint posted online April 22, 2017.</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.1704.06841"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1704.06841</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yogarajan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Montiel</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Pfahringer</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Seeing the whole patient: using multi-label medical text classification techniques to enhance predictions of medical codes</article-title>
          <source>arXiv:2004.00430v1 [cs.IR]</source>
          <comment>Preprint posted online March 29, 2020.</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.2004.00430"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wasim</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Asim</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Ghani Khan</surname>
              <given-names>MU</given-names>
            </name>
            <name name-style="western">
              <surname>Mahmood</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Multi-label biomedical question classification for lexical answer type prediction</article-title>
          <source>J Biomed Inform</source>
          <year>2019</year>
          <month>05</month>
          <volume>93</volume>
          <fpage>103143</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30061-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103143</pub-id>
          <pub-id pub-id-type="medline">30872137</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30061-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baumel</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Nassour-Kassis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Multi-label classification of patient notes: case study on ICD code assignment</article-title>
          <source>arXiv:1709.09587v3 [cs.CL] </source>
          <comment>Preprint posted online September 27, 2012.</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.1709.09587"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="web">
          <article-title>Cancer type list</article-title>
          <source>International Cancer Research Partnership</source>
          <access-date>2023-09-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.icrpartnership.org/cancer-type-list">https://www.icrpartnership.org/cancer-type-list</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bryant</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>O'Hallaron</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <source>Computer Systems: A Programmer's Perspective (3rd Edition)</source>
          <year>2016</year>
          <publisher-loc>London, UK</publisher-loc>
          <publisher-name>Pearson</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Matsuo</surname>
              <given-names>Koji</given-names>
            </name>
            <name name-style="western">
              <surname>Mandelbaum</surname>
              <given-names>Rachel S</given-names>
            </name>
            <name name-style="western">
              <surname>Machida</surname>
              <given-names>Hiroko</given-names>
            </name>
            <name name-style="western">
              <surname>Yoshihara</surname>
              <given-names>Kosuke</given-names>
            </name>
            <name name-style="western">
              <surname>Matsuzaki</surname>
              <given-names>Shinya</given-names>
            </name>
            <name name-style="western">
              <surname>Klar</surname>
              <given-names>Maximilian</given-names>
            </name>
            <name name-style="western">
              <surname>Muggia</surname>
              <given-names>Franco M</given-names>
            </name>
            <name name-style="western">
              <surname>Roman</surname>
              <given-names>Lynda D</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>Jason D</given-names>
            </name>
          </person-group>
          <article-title>Temporal trends of subsequent breast cancer among women with ovarian cancer: a population-based study</article-title>
          <source>Arch Gynecol Obstet</source>
          <year>2020</year>
          <month>05</month>
          <volume>301</volume>
          <issue>5</issue>
          <fpage>1235</fpage>
          <lpage>1245</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32206877"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s00404-020-05508-3</pub-id>
          <pub-id pub-id-type="medline">32206877</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00404-020-05508-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC7528443</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Chang</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Yali</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Xin</given-names>
            </name>
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>Feng</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>Songjie</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Ying</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Qiang</given-names>
            </name>
          </person-group>
          <article-title>Clinical characteristics and survival outcomes of patients with both primary breast cancer and primary ovarian cancer</article-title>
          <source>Medicine (Baltimore)</source>
          <year>2020</year>
          <month>08</month>
          <day>07</day>
          <volume>99</volume>
          <issue>32</issue>
          <fpage>e21560</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32769897"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/MD.0000000000021560</pub-id>
          <pub-id pub-id-type="medline">32769897</pub-id>
          <pub-id pub-id-type="pii">00005792-202008070-00038</pub-id>
          <pub-id pub-id-type="pmcid">PMC7593036</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Woopen</surname>
              <given-names>Hannah</given-names>
            </name>
            <name name-style="western">
              <surname>Rolf</surname>
              <given-names>Carolin</given-names>
            </name>
            <name name-style="western">
              <surname>Braicu</surname>
              <given-names>Elena Ioana</given-names>
            </name>
            <name name-style="western">
              <surname>Buttmann-Schweiger</surname>
              <given-names>Nina</given-names>
            </name>
            <name name-style="western">
              <surname>Barnes</surname>
              <given-names>Benjamin</given-names>
            </name>
            <name name-style="western">
              <surname>Baum</surname>
              <given-names>Joanna</given-names>
            </name>
            <name name-style="western">
              <surname>Pietzner</surname>
              <given-names>Klaus</given-names>
            </name>
            <name name-style="western">
              <surname>Kraywinkel</surname>
              <given-names>Klaus</given-names>
            </name>
            <name name-style="western">
              <surname>Sehouli</surname>
              <given-names>Jalid</given-names>
            </name>
          </person-group>
          <article-title>Secondary malignancies in long-term ovarian cancer survivors: results of the 'Carolin meets HANNA' study</article-title>
          <source>Int J Gynecol Cancer</source>
          <year>2021</year>
          <month>05</month>
          <day>01</day>
          <volume>31</volume>
          <issue>5</issue>
          <fpage>709</fpage>
          <lpage>712</lpage>
          <pub-id pub-id-type="doi">10.1136/ijgc-2020-002155</pub-id>
          <pub-id pub-id-type="medline">33649156</pub-id>
          <pub-id pub-id-type="pii">ijgc-2020-002155</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yun</surname>
              <given-names>E Hwa</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>Seri</given-names>
            </name>
            <name name-style="western">
              <surname>Her</surname>
              <given-names>Eun Young</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>Bomi</given-names>
            </name>
            <name name-style="western">
              <surname>Suh</surname>
              <given-names>Mina</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>Kui Son</given-names>
            </name>
            <name name-style="western">
              <surname>Jun</surname>
              <given-names>Jae Kwan</given-names>
            </name>
          </person-group>
          <article-title>Trends in Participation Rates of the National Cancer Screening Program among Cancer Survivors in Korea</article-title>
          <source>Cancers (Basel)</source>
          <year>2020</year>
          <month>12</month>
          <day>30</day>
          <volume>13</volume>
          <issue>1</issue>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=cancers13010081"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/cancers13010081</pub-id>
          <pub-id pub-id-type="medline">33396692</pub-id>
          <pub-id pub-id-type="pii">cancers13010081</pub-id>
          <pub-id pub-id-type="pmcid">PMC7796127</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sato</surname>
              <given-names>Akira</given-names>
            </name>
            <name name-style="western">
              <surname>Matsubayashi</surname>
              <given-names>Keisuke</given-names>
            </name>
            <name name-style="western">
              <surname>Morishima</surname>
              <given-names>Toshitaka</given-names>
            </name>
            <name name-style="western">
              <surname>Nakata</surname>
              <given-names>Kayo</given-names>
            </name>
            <name name-style="western">
              <surname>Kawakami</surname>
              <given-names>Koji</given-names>
            </name>
            <name name-style="western">
              <surname>Miyashiro</surname>
              <given-names>Isao</given-names>
            </name>
          </person-group>
          <article-title>Increasing trends in the prevalence of prior cancer in newly diagnosed lung, stomach, colorectal, breast, cervical, and corpus uterine cancer patients: a population-based study</article-title>
          <source>BMC Cancer</source>
          <year>2021</year>
          <month>03</month>
          <day>10</day>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>264</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmccancer.biomedcentral.com/articles/10.1186/s12885-021-08011-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12885-021-08011-3</pub-id>
          <pub-id pub-id-type="medline">33691661</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12885-021-08011-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC7948331</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>An</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Matsuda</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Bray</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Cancer registration in China and its role in cancer prevention and control</article-title>
          <source>The Lancet Oncology</source>
          <year>2020</year>
          <month>07</month>
          <volume>21</volume>
          <issue>7</issue>
          <fpage>e342</fpage>
          <lpage>e349</lpage>
          <pub-id pub-id-type="doi">10.1016/s1470-2045(20)30073-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Qiu</surname>
              <given-names>Haibo</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>Sumei</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Ruihua</given-names>
            </name>
          </person-group>
          <article-title>Cancer incidence, mortality, and burden in China: a time-trend analysis and comparison with the United States and United Kingdom based on the global epidemiological data released in 2020</article-title>
          <source>Cancer Commun (Lond)</source>
          <year>2021</year>
          <month>10</month>
          <volume>41</volume>
          <issue>10</issue>
          <fpage>1037</fpage>
          <lpage>1048</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34288593"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/cac2.12197</pub-id>
          <pub-id pub-id-type="medline">34288593</pub-id>
          <pub-id pub-id-type="pmcid">PMC8504144</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>Young-Rock</given-names>
            </name>
            <name name-style="western">
              <surname>Huo</surname>
              <given-names>Jinhai</given-names>
            </name>
            <name name-style="western">
              <surname>Desai</surname>
              <given-names>Raj</given-names>
            </name>
            <name name-style="western">
              <surname>Cardel</surname>
              <given-names>Michelle</given-names>
            </name>
            <name name-style="western">
              <surname>Deshmukh</surname>
              <given-names>Ashish A</given-names>
            </name>
          </person-group>
          <article-title>Excess Costs and Economic Burden of Obesity-Related Cancers in the United States</article-title>
          <source>Value Health</source>
          <year>2019</year>
          <month>12</month>
          <volume>22</volume>
          <issue>12</issue>
          <fpage>1378</fpage>
          <lpage>1386</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1098-3015(19)32266-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jval.2019.07.004</pub-id>
          <pub-id pub-id-type="medline">31806194</pub-id>
          <pub-id pub-id-type="pii">S1098-3015(19)32266-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7313233</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Yong</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Peiyang</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>Ganfeng</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Di</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>Huachun</given-names>
            </name>
          </person-group>
          <article-title>Cancer attributable to human papillomavirus infection in China: Burden and trends</article-title>
          <source>Cancer</source>
          <year>2020</year>
          <month>08</month>
          <day>15</day>
          <volume>126</volume>
          <issue>16</issue>
          <fpage>3719</fpage>
          <lpage>3732</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/doi/10.1002/cncr.32986"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/cncr.32986</pub-id>
          <pub-id pub-id-type="medline">32484937</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>Young-Rock</given-names>
            </name>
            <name name-style="western">
              <surname>Huo</surname>
              <given-names>Jinhai</given-names>
            </name>
            <name name-style="western">
              <surname>Desai</surname>
              <given-names>Raj</given-names>
            </name>
            <name name-style="western">
              <surname>Cardel</surname>
              <given-names>Michelle</given-names>
            </name>
            <name name-style="western">
              <surname>Deshmukh</surname>
              <given-names>Ashish A</given-names>
            </name>
          </person-group>
          <article-title>Excess Costs and Economic Burden of Obesity-Related Cancers in the United States</article-title>
          <source>Value Health</source>
          <year>2019</year>
          <month>12</month>
          <volume>22</volume>
          <issue>12</issue>
          <fpage>1378</fpage>
          <lpage>1386</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1098-3015(19)32266-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jval.2019.07.004</pub-id>
          <pub-id pub-id-type="medline">31806194</pub-id>
          <pub-id pub-id-type="pii">S1098-3015(19)32266-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7313233</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fonnes</surname>
              <given-names>Tina</given-names>
            </name>
            <name name-style="western">
              <surname>Telle</surname>
              <given-names>Ingrid O</given-names>
            </name>
            <name name-style="western">
              <surname>Forsse</surname>
              <given-names>David</given-names>
            </name>
            <name name-style="western">
              <surname>Falck</surname>
              <given-names>Runa</given-names>
            </name>
            <name name-style="western">
              <surname>Trovik</surname>
              <given-names>Jone</given-names>
            </name>
            <name name-style="western">
              <surname>Haldorsen</surname>
              <given-names>Ingfrid S</given-names>
            </name>
            <name name-style="western">
              <surname>Krakstad</surname>
              <given-names>Camilla</given-names>
            </name>
          </person-group>
          <article-title>Cancer awareness in the general population varies with sex, age and media coverage: A population-based survey with focus on gynecologic cancers</article-title>
          <source>Eur J Obstet Gynecol Reprod Biol</source>
          <year>2021</year>
          <month>01</month>
          <volume>256</volume>
          <fpage>25</fpage>
          <lpage>31</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0301-2115(20)30690-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ejogrb.2020.10.051</pub-id>
          <pub-id pub-id-type="medline">33161211</pub-id>
          <pub-id pub-id-type="pii">S0301-2115(20)30690-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kye</surname>
              <given-names>Su Yeon</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Hyun Jeong</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Yeonseung</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Young Ae</given-names>
            </name>
          </person-group>
          <article-title>Public Attitudes towards Cancer Survivors among Korean Adults</article-title>
          <source>Cancer Res Treat</source>
          <year>2020</year>
          <month>07</month>
          <volume>52</volume>
          <issue>3</issue>
          <fpage>722</fpage>
          <lpage>729</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32054152"/>
          </comment>
          <pub-id pub-id-type="doi">10.4143/crt.2019.265</pub-id>
          <pub-id pub-id-type="medline">32054152</pub-id>
          <pub-id pub-id-type="pii">crt.2019.265</pub-id>
          <pub-id pub-id-type="pmcid">PMC7373876</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Curado</surname>
              <given-names>Maria Paula</given-names>
            </name>
          </person-group>
          <article-title>Importance of hospital cancer registries in Africa</article-title>
          <source>Ecancermedicalscience</source>
          <year>2019</year>
          <volume>13</volume>
          <fpage>948</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31552121"/>
          </comment>
          <pub-id pub-id-type="doi">10.3332/ecancer.2019.948</pub-id>
          <pub-id pub-id-type="medline">31552121</pub-id>
          <pub-id pub-id-type="pii">can-13-948</pub-id>
          <pub-id pub-id-type="pmcid">PMC6722112</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Lei</given-names>
            </name>
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>Xiaomeng</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>Zian</given-names>
            </name>
            <name name-style="western">
              <surname>Zhi</surname>
              <given-names>Xiangcheng</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Sheng</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Jin</given-names>
            </name>
          </person-group>
          <article-title>Correlation between family history and characteristics of breast cancer</article-title>
          <source>Sci Rep</source>
          <year>2021</year>
          <month>03</month>
          <day>18</day>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>6360</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-021-85899-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-021-85899-8</pub-id>
          <pub-id pub-id-type="medline">33737705</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-021-85899-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC7973811</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rantala</surname>
              <given-names>Jasmiina N J</given-names>
            </name>
            <name name-style="western">
              <surname>Heikkinen</surname>
              <given-names>Sanna M M</given-names>
            </name>
            <name name-style="western">
              <surname>Hirvonen</surname>
              <given-names>Elli M</given-names>
            </name>
            <name name-style="western">
              <surname>Tanskanen</surname>
              <given-names>Tomas</given-names>
            </name>
            <name name-style="western">
              <surname>Malila</surname>
              <given-names>Nea K</given-names>
            </name>
            <name name-style="western">
              <surname>Pitkäniemi</surname>
              <given-names>Janne M</given-names>
            </name>
          </person-group>
          <article-title>Familial aggregation of early-onset cancers in early-onset breast cancer families</article-title>
          <source>Int J Cancer</source>
          <year>2023</year>
          <month>07</month>
          <day>15</day>
          <volume>153</volume>
          <issue>2</issue>
          <fpage>331</fpage>
          <lpage>340</lpage>
          <pub-id pub-id-type="doi">10.1002/ijc.34538</pub-id>
          <pub-id pub-id-type="medline">37074269</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>Yu Rong</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Shang-Pin</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>Kuan Y</given-names>
            </name>
          </person-group>
          <article-title>Trends in regional cancer mortality in Taiwan 1992-2014</article-title>
          <source>Cancer Epidemiol</source>
          <year>2019</year>
          <month>04</month>
          <volume>59</volume>
          <fpage>185</fpage>
          <lpage>192</lpage>
          <pub-id pub-id-type="doi">10.1016/j.canep.2019.02.005</pub-id>
          <pub-id pub-id-type="medline">30825841</pub-id>
          <pub-id pub-id-type="pii">S1877-7821(18)30146-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Dong-Sook</given-names>
            </name>
            <name name-style="western">
              <surname>Ahn</surname>
              <given-names>Hyeong Sik</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Hyun Jung</given-names>
            </name>
          </person-group>
          <article-title>Statin use and incidence and mortality of breast and gynecology cancer: A cohort study using the National Health Insurance claims database</article-title>
          <source>Int J Cancer</source>
          <year>2022</year>
          <month>04</month>
          <day>01</day>
          <volume>150</volume>
          <issue>7</issue>
          <fpage>1156</fpage>
          <lpage>1165</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/doi/10.1002/ijc.33869"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/ijc.33869</pub-id>
          <pub-id pub-id-type="medline">34751444</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>Julie M</given-names>
            </name>
            <name name-style="western">
              <surname>Isaacs</surname>
              <given-names>Claudine</given-names>
            </name>
          </person-group>
          <article-title>Management of breast cancer risk in BRCA1/2 mutation carriers who are unaffected with cancer</article-title>
          <source>Breast J</source>
          <year>2020</year>
          <month>08</month>
          <volume>26</volume>
          <issue>8</issue>
          <fpage>1520</fpage>
          <lpage>1527</lpage>
          <pub-id pub-id-type="doi">10.1111/tbj.13970</pub-id>
          <pub-id pub-id-type="medline">32652823</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Qiang</surname>
              <given-names>Judy K</given-names>
            </name>
            <name name-style="western">
              <surname>Lipscombe</surname>
              <given-names>Lorraine L</given-names>
            </name>
            <name name-style="western">
              <surname>Lega</surname>
              <given-names>Iliana C</given-names>
            </name>
          </person-group>
          <article-title>Association between diabetes, obesity, aging, and cancer: review of recent literature</article-title>
          <source>Transl Cancer Res</source>
          <year>2020</year>
          <month>09</month>
          <volume>9</volume>
          <issue>9</issue>
          <fpage>5743</fpage>
          <lpage>5759</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35117936"/>
          </comment>
          <pub-id pub-id-type="doi">10.21037/tcr.2020.03.14</pub-id>
          <pub-id pub-id-type="medline">35117936</pub-id>
          <pub-id pub-id-type="pii">tcr-09-09-5743</pub-id>
          <pub-id pub-id-type="pmcid">PMC8797908</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dyba</surname>
              <given-names>Tadeusz</given-names>
            </name>
            <name name-style="western">
              <surname>Randi</surname>
              <given-names>Giorgia</given-names>
            </name>
            <name name-style="western">
              <surname>Bray</surname>
              <given-names>Freddie</given-names>
            </name>
            <name name-style="western">
              <surname>Martos</surname>
              <given-names>Carmen</given-names>
            </name>
            <name name-style="western">
              <surname>Giusti</surname>
              <given-names>Francesco</given-names>
            </name>
            <name name-style="western">
              <surname>Nicholson</surname>
              <given-names>Nicholas</given-names>
            </name>
            <name name-style="western">
              <surname>Gavin</surname>
              <given-names>Anna</given-names>
            </name>
            <name name-style="western">
              <surname>Flego</surname>
              <given-names>Manuela</given-names>
            </name>
            <name name-style="western">
              <surname>Neamtiu</surname>
              <given-names>Luciana</given-names>
            </name>
            <name name-style="western">
              <surname>Dimitrova</surname>
              <given-names>Nadya</given-names>
            </name>
            <name name-style="western">
              <surname>Negrão Carvalho</surname>
              <given-names>Raquel</given-names>
            </name>
            <name name-style="western">
              <surname>Ferlay</surname>
              <given-names>Jacques</given-names>
            </name>
            <name name-style="western">
              <surname>Bettio</surname>
              <given-names>Manola</given-names>
            </name>
          </person-group>
          <article-title>The European cancer burden in 2020: Incidence and mortality estimates for 40 countries and 25 major cancers</article-title>
          <source>Eur J Cancer</source>
          <year>2021</year>
          <month>11</month>
          <volume>157</volume>
          <fpage>308</fpage>
          <lpage>347</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0959-8049(21)00497-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ejca.2021.07.039</pub-id>
          <pub-id pub-id-type="medline">34560371</pub-id>
          <pub-id pub-id-type="pii">S0959-8049(21)00497-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC8568058</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
