<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i11e30356</article-id>
      <article-id pub-id-type="pmid">34747707</article-id>
      <article-id pub-id-type="doi">10.2196/30356</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Health Information Needs of Young Chinese People Based on an Online Health Community: Topic and Statistical Analysis</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Lovis</surname>
            <given-names>Christian</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Xu</surname>
            <given-names>Stanley</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Wei</surname>
            <given-names>Shanzun</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Jie</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>School of Management</institution>
            <institution>Capital Normal University</institution>
            <addr-line>No. 56 Xisanhuan North Rd, Haidian District</addr-line>
            <addr-line>Beijing, 100089</addr-line>
            <country>China</country>
            <phone>86 01068901018</phone>
            <email>wangjie@cnu.edu.cn</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1262-6719</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Xin</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8639-3818</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Lei</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6538-0193</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Peng</surname>
            <given-names>Yan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5003-6923</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>School of Management</institution>
        <institution>Capital Normal University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>State key Laboratory of Networking and Switching Technology</institution>
        <institution>Beijing University of Posts and Telecommunications</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Electrical and Computer Engineering</institution>
        <institution>The State University of New York at Stony Brook</institution>
        <addr-line>Stony Brook, NY</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Jie Wang <email>wangjie@cnu.edu.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>11</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>8</day>
        <month>11</month>
        <year>2021</year>
      </pub-date>
      <volume>9</volume>
      <issue>11</issue>
      <elocation-id>e30356</elocation-id>
      <history>
        <date date-type="received">
          <day>12</day>
          <month>5</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>6</day>
          <month>7</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>30</day>
          <month>8</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>25</day>
          <month>9</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Jie Wang, Xin Wang, Lei Wang, Yan Peng. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 08.11.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2021/11/e30356" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The internet has been widely accessible and well accepted by young people; however, there is a limited understanding of the internet usage patterns and characteristics on issues related to health problems. The contents posted on online health communities (OHCs) are valuable resources to learn about youth's health information needs.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>In this study, we concurrently exploited statistical analysis and topic analysis of online health information needs to explore the distribution, impact factors, and topics of interest relevant to Chinese young people.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We collected 60,478 health-related data sets posted by young people from a well-known Chinese OHC named xywy.com. Descriptive statistical analysis and correlation analysis were applied to find the distribution and influence factors of the information needs of Chinese young people. Furthermore, a general 4-step topic mining strategy was presented for sparse short texts, which included sentence vectorization, dimension reduction, clustering, and keyword generation.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>In the Chinese OHC, Chinese young people had a high demand for information in the areas of gynecology and obstetrics, internal medicine, dermatology, plastic surgery, and surgery, and they focused on topics such as treatment, symptoms, causes, pathology, and diet. Females accounted for 69.67% (42,136/60,478) and young adults accounted for 87.44% (52,882/60,478) of all data. Gender, age, and disease type all had a significant effect on young people's information needs and topic preferences (<italic>P</italic>&#60;.001).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>We conducted comprehensive analyses to discover the online health information needs of Chinese young people. The research findings are of great practical value to carry out health education and health knowledge dissemination inside and outside of schools according to the interests of youth, enable the innovation of information services in OHCs, and improve the health literacy of young people.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>information needs</kwd>
        <kwd>young people</kwd>
        <kwd>online health community</kwd>
        <kwd>topic analysis</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>To live a healthy life, people may pay greater attention to the information related to physical and mental health, disease, nutrition, and health protection. Heath information can guide health and clinical behaviors [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>], and the availability of the internet makes it convenient to retrieve health-related information [<xref ref-type="bibr" rid="ref3">3</xref>]. According to the search behavior report on popular science needs of Chinese citizens in 2018 [<xref ref-type="bibr" rid="ref4">4</xref>], health and medical science rank the first in the search index among the popular science topics concerned, with a search proportion of 66.8%. The large number of users and the convenience of information access make online health communities (OHCs) one of the most important sources for searching and exchanging health-related information, experiences, advice, support, and opinions [<xref ref-type="bibr" rid="ref5">5</xref>]. The large-scale sharing of health information also makes OHCs a valuable and abundant source of data for addressing public health questions [<xref ref-type="bibr" rid="ref6">6</xref>]. Therefore, user-generated content in OHCs is one of the most direct and convenient ways of learning the topics of interest for users [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
        <p>Young people are the future and the hope of all nations, thus promoting the health of young people is an important part of the strategy of a healthy China. Youth aged between 10 to 19 years face a range of health risks and this age is an important developmental period when health behaviors, values, and attitudes are established; these are often carried into adulthood [<xref ref-type="bibr" rid="ref8">8</xref>]. According to the definition of young people from World Health Organization (WHO), we defined those between 10 and 25 years of age as young people, and within this group, those between 18 and 25 years old as young adults and those between 10 and 17 years old as minors, to provide a deeper understanding of the characteristics of health-related internet usage for this important age group [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
        <p>Although the internet is widely accessible and well accepted by young people, there is a limited understanding of internet usage patterns and characteristics on issues related to health problems [<xref ref-type="bibr" rid="ref10">10</xref>]. Despite the importance, little progress has been made to meet the need of providing online health information. Research on young people’s online health mostly rely on data collected from questionnaire surveys or interviews, with the number of data samples being fewer than 1000 [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>]. These can hardly be expected to represent the actual information needs of young people. The related data analyses have been mostly based on basic statistics and correlation of questionnaire data and interview data [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref15">15</xref>], and few studies have been performed with the aim of understanding the user-generated content through natural language processing (NLP) techniques to discover the topics and interests of youth.</p>
        <p>The analysis of content of online health information, however, is very hard. The user-generated question and answer text data in OHC is often short in length and sparse in content, and the sparsity in short-text documents poses great challenges for topic analysis. Classic topic models such as latent Dirichlet allocation [<xref ref-type="bibr" rid="ref16">16</xref>] and probabilistic latent semantic analysis [<xref ref-type="bibr" rid="ref17">17</xref>] fail to work effectively due to the lack of word co-occurrence patterns in each short document [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. Another feasible way to realize topic analysis for short text is based on word embedding models, such as Word2Vec [<xref ref-type="bibr" rid="ref20">20</xref>]. However, such models usually use static coding methods and only consider the local information of the text. Without the overall information, this method cannot distinguish feature words by context semantics [<xref ref-type="bibr" rid="ref21">21</xref>]. In addition, because of the sparsity, the feature vector cannot represent the semantics of short text well.</p>
      </sec>
      <sec>
        <title>Related Work</title>
        <p>In this section, we summarize the related work that investigated the online health information need of young people, including the work on data collection, data analysis methods, and the discovered topics.</p>
        <p>The growth of the internet has made health information more accessible than ever before [<xref ref-type="bibr" rid="ref22">22</xref>]. For young people, the daily internet access rate is generally high, and the internet has become an important resource to support their self-care and health-related activities and services [<xref ref-type="bibr" rid="ref10">10</xref>].</p>
        <p>Many studies have been made to understand the online health information needs of young people. The data collection approaches used include questionnaire survey, interview, and web crawler collection [<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref25">25</xref>]. The corresponding data analysis methods are also different. For the questionnaires and survey data, descriptive statistical analysis, correlation analysis, and multiple logistic regression analysis are generally applied [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. For interview data, many studies use content analysis and statistical analysis [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. Recently, with the increase of user-generated content from OHCs, social media, and health service websites, some researchers have begun to collect data through web crawler and to develop text mining techniques, such as topic analysis and sentiment analysis, to discover user health information needs [<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref28">28</xref>]. For example, text mining technology was used to analyze the pregnancy data of MedHelp in OHCs, and the adopted and unused answers were classified with a support vector machine–radial basis function kernel classification algorithm [<xref ref-type="bibr" rid="ref26">26</xref>]. Based on the extracted information of 1000 consultation records from one OHC, the features of the health information needs of patients with hypertension were explored by content analysis and clustering analysis [<xref ref-type="bibr" rid="ref28">28</xref>].</p>
        <p>A variety of studies have been conducted to find the topics of interest of young people from online health information [<xref ref-type="bibr" rid="ref10">10</xref>]. The results indicate that most online health information is closely related to the self-development of young people. The topics include daily health-related issues [<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref31">31</xref>], physical growth [<xref ref-type="bibr" rid="ref13">13</xref>], mental health [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>], sexual and reproductive health [<xref ref-type="bibr" rid="ref34">34</xref>-<xref ref-type="bibr" rid="ref36">36</xref>], and physiological diseases [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. Daily health-related issues, such as exercise and nutrition, beauty and skin care, fitness and diet, flu, and infection draw significant attention from young people [<xref ref-type="bibr" rid="ref29">29</xref>]. They also use internet information on symptoms and treatment options for physiological diseases, such as arthritis or diabetes, and may turn to alternative sources according to the topic [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. Young people who experience mental health issues often seek help and information related to their psychosocial health and advice from peers or doctors online [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. For sexual health issues, both males and females are likely to look for information and help about such sensitive topics [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. The internet has become a major resource for young people in supporting their self-care and health-related activities and services. The actual needs of young people may vary across different countries or different age groups [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>].</p>
        <p>Although many studies have been made on the online health information of young people, the number of samples for most is small and does not adequately reflect the general needs of youth. Moreover, previous studies have generally not been based on user-generated content nor have they used NLP technology to develop further research.</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>To fill the gap of current research, this paper presents a framework with a set of techniques to analyze online health information of interest to youth in China. The main contributions of this paper are the following.</p>
        <p>We propose a topic analysis scheme to extract information from short-text messages in 4 steps: sentence vectorization, dimension reduction, clustering, and keyword generation. We used the advanced pretrained Siamese network model sentence-BERT (SBERT) to generate high-quality sentence vectors and principal component analysis (PCA) to reduce the vector dimension for more effective clustering. These techniques can be extended to apply to other topic extraction tasks based on short texts from the internet.</p>
        <p>Concurrently exploiting statistical analysis and topic analysis, we also explored the distribution, impact factors, and topics of interest based on the online health information of Chinese young people posted on a popular Chinese OHC. The research findings are of great practical value to carry out health education and health knowledge dissemination inside and outside schools according to the interests of youth, enable the innovation of information services in OHCs, and improve the health literacy of young people.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design</title>
        <p>The overall research framework is displayed in <xref rid="figure1" ref-type="fig">Figure 1</xref>. It was divided into 4 major steps: input data preparation, data preprocessing, data analysis, and findings discussion. Among these, the data analysis consisted of 2 parts: statistical analysis and topic analysis. The statistical analysis part applied descriptive statistical analysis and correlation analysis to find the distribution and major factors related to Chinese youth’s information needs. Meanwhile, the topic analysis part used a 4-step strategy to mine the topics of specific diseases. In the 4-step topic extraction strategy, the first step used the representative pretrained language model SBERT to realize the sentence vectorization. The PCA algorithm was then used to reduce the vector dimension to improve the clustering efficiency and accuracy. After the optimal number of clusters was determined by the silhouette coefficient, a <italic>k</italic>-means clustering algorithm was adopted to get <italic>k</italic> clusters, term frequency–inverse document frequency (TF-IDF) was applied to acquire the keywords of each cluster, and the information needs topics were generated.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Research framework. OHC: online health community; PCA: principal component analysis; Q&#38;A: question and answer; SBERT: sentence-BERT; TF–IDF: term frequency–inverse document frequency.</p>
          </caption>
          <graphic xlink:href="medinform_v9i11e30356_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Input Data Preparation</title>
        <p>Our data set was collected by a web crawler from a popular Chinese OHC named xywy.com, which allows users to publish health-related questions in many different disease categories. xywy.com is one of the OHCs that had explored and implemented medical and health services in China earlier. As the pioneer of OHC, its completeness and accuracy of information content are widely recognized [<xref ref-type="bibr" rid="ref40">40</xref>].</p>
        <p>A total of 60,478 question and answer messages posted by young users from June 1, 2019, to June 1, 2020, were collected as input data. Each message contained a set of tags, including user gender, age, question time, department affiliation, question title, question content, and doctor’s responses.</p>
      </sec>
      <sec>
        <title>Data Preprocessing</title>
        <p>There were 2 important steps in data preprocessing: word segmentation and removing stop words. As the data source in this study was closely related to medical and health terms, the accuracy of word segmentation could be improved by combining them with a Chinese medical thesaurus. In this study, the Jieba library and Chinese medical thesaurus, CMesh [<xref ref-type="bibr" rid="ref41">41</xref>], were used together to facilitate the word segmentation.</p>
        <p>Removing the stop words that convey little useful meaning can reduce the dimension of the feature space [<xref ref-type="bibr" rid="ref42">42</xref>]. Therefore, after applying the Baidu stop-word table, we removed all stop words, including articles, conjunctions, pronouns, and linking verbs.</p>
      </sec>
      <sec>
        <title>Topic Extraction Strategies</title>
        <p>We created a set of questions about a specific disease, <italic>Q</italic>= {<italic>q</italic><sub>1</sub>, <italic>q</italic><sub>2</sub>, …<italic>q</italic><sub>&#124;Q&#124;</sub>}. It contained &#124;Q&#124; questions, and <italic>q<sub>i</sub></italic> was the <italic>i</italic>-th question in <italic>Q</italic>. For topic extraction from <italic>Q</italic>, we needed to first cluster questions in <italic>Q</italic> into <italic>k</italic> clusters <italic>C<sub>1</sub>, C<sub>2</sub>,</italic> …<italic>C<sub>k</sub></italic>, and then generate <italic>N</italic> key words to provide the topic of cluster <italic>C<sub>j</sub></italic>.</p>
        <sec>
          <title>Sentence Vectorization</title>
          <p>To extract topics from <italic>Q</italic>, the first thing was to represent the short question text data <italic>q<sub>i</sub></italic> in <italic>Q</italic> with an appropriate form to calculate the distance between question texts. As mentioned earlier, standard topic models and general word embedding methods were not suitable for this task. Therefore, we applied an effective pretrained NLP model in this step.</p>
          <p>BERT [<xref ref-type="bibr" rid="ref43">43</xref>] is now widely used in various NLP tasks. However, the sentence representation generated by BERT is not efficient for a clustering purpose. As BERT requires 2 sentences to be entered into the model at the same time for information interaction when calculating semantic similarity, it results in a significant computational overhead, and experiments [<xref ref-type="bibr" rid="ref44">44</xref>] have shown the results to usually be even worse than those of some word-embeddings models.</p>
          <p>Instead, we chose the improved pretrained model SBERT [<xref ref-type="bibr" rid="ref44">44</xref>] to generate sentence vectors for the question text in <italic>Q</italic>. As shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>, SBERT used Siamese network structure to generate semantically meaningful sentence vector representations. In the input stage, sentences <italic>q<sub>i</sub></italic> and <italic>q<sub>j</sub></italic> were each encoded by pretrained BERT. After that, the 2 sentences were normalized through a pooling layer to obtain the fixed-length vectors <italic>u</italic> and <italic>v</italic>. After this, the (<italic>u, v,</italic> &#124;<italic>u-v</italic>&#124;) concatenated by <italic>u</italic>, <italic>v</italic>, and &#124;<italic>u-v</italic>&#124; was passed through the softmax layer to acquire the classification labels of the 2 sentence vectors, where &#124;<italic>u-v</italic>&#124; denoted the element-wise difference between <italic>u</italic> and <italic>v</italic>. SBERT directly used the cosine similarity to compare the similarity between 2 sentence vectors, which greatly improved the speed of inference while maintaining accuracy.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>The procedure of sentence vectorization based on sentence-BERT. CLS: a sign placed at the beginning of a sentence for subsequent classification tasks; SEP: a sign placed between 2 sentences to distinguish them; TOK: token embedding.</p>
            </caption>
            <graphic xlink:href="medinform_v9i11e30356_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Dimension Reduction for Sentence Vectors</title>
          <p>After punctuation and invalid symbols were removed, <italic>q<sub>i</sub></italic> in <italic>Q</italic> had the average length of 45 Chinese characters. For each <italic>q<sub>i</sub></italic> in <italic>Q</italic>, SBERT generated a 512-dimension vector. A higher dimension causes more computation overhead and prevents the cluster algorithm from achieving better results on a relatively large input data set. We thus chose to use the PCA technique to reduce the vectors dimension, which is an effective method to process, compress, and extract information based on the covariance matrix of variables.</p>
          <p>To reduce the dimension of <italic>n</italic> <italic>m</italic>-dimensional vector matrix <italic>R<sup>n</sup></italic> <sup>×</sup> <italic><sup>m</sup></italic> generated by SBERT, we first calculated the eigenvalues and eigenvectors of the correlation matrix <italic>R</italic> of <italic>R<sup>n</sup></italic> <sup>×</sup> <italic><sup>m</sup></italic>, and then <italic>R<sup>n</sup></italic> <sup>×</sup> <italic><sup>m</sup></italic> was projected to the eigenvector space <italic>R<sup>n</sup></italic> <sup>×</sup> <italic><sup>k</sup></italic> corresponding to the first <italic>k</italic>-dominant eigenvalues whose cumulative contribution rate was <italic>λ</italic>. That is, the original vector was reduced from the <italic>m</italic>-dimension to the <italic>k</italic>-dimension.</p>
        </sec>
        <sec>
          <title>Sentence Vector Clustering</title>
          <p>For topic extraction, we first clustered sentence vectors output by SBERT. In this step, it is necessary to measure the distance (or similarity) between 2 sentence vectors and determine the number of clusters to form.</p>
          <p>In this study, all the sentence vectors generated by SBERT had the same length, and the cosine distance [<xref ref-type="bibr" rid="ref45">45</xref>] was used to measure the similarity between 2 sentence vectors. <italic>k</italic>-means clustering algorithm was then adopted to get <italic>k</italic> clusters, with each cluster being a topic for a specific disease.</p>
          <p>The clustering number <italic>k</italic> had an important influence on the clustering results of the <italic>k</italic>-means algorithm, and we used the silhouette coefficient [<xref ref-type="bibr" rid="ref46">46</xref>] to evaluate the clustering effect, which combined 2 factors, cluster intracohesion and cluster interdissimilarity.</p>
        </sec>
        <sec>
          <title>Generation Of Keywords</title>
          <p>Keywords needed to be generated to describe the topics of interest in different clusters. The representation method based on frequent values has often been used because it reduces the text dimension and has a better effect [<xref ref-type="bibr" rid="ref47">47</xref>]; we thus applied the TF-IDF algorithm [<xref ref-type="bibr" rid="ref48">48</xref>] to extract keywords from the clusters results.</p>
          <p>For each cluster <italic>C<sub>j</sub></italic>, TF-IDF was used to calculate the importance of words in <italic>C<sub>j</sub></italic>, and key words were selected based on the importance level of words. After the high word frequency in a cluster and the low text frequency in the disease question set were combined, the top <italic>N</italic> words with high word importance levels were selected to generate the topic words for a certain disease, and <italic>N</italic> was the user setting parameter. Thus, the topics of information needed for a certain disease were generated according to the topic words of each cluster.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>We conducted a set of experiments over the real user-generated data set crawled online to reveal the distribution, influence factors, and topics of interest of Chinese young people.</p>
      <p>The models and algorithms in this paper were programmed based on Python 3.6 (Python Software Foundation) under the deep learning framework PyTorch 1.5.1 and TensorFlow 1.14.</p>
      <p>To evaluate the clustering effect for short-text based on the sentence vectors generated by BERT and SBERT, we selected 8701 samples from the whole data set that had disease labels from different departments. Experiment results showed that the clustering effect was significantly improved by SBERT, with adjusted Rand index [<xref ref-type="bibr" rid="ref49">49</xref>], adjusted mutual information [<xref ref-type="bibr" rid="ref50">50</xref>], and Fowlkes and Mallows index [<xref ref-type="bibr" rid="ref51">51</xref>] evaluation metric values of 32.1%, 28.6%, and 25.1% higher than those of BERT, respectively.</p>
      <sec>
        <title>The Results of Statistical Analysis</title>
        <p>The distribution of Chinese young people's interests based on the collected data of the health information is shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>. Based on the percentage of the question data, the needs were mainly concentrated in gynecology and obstetrics, internal medicine, dermatology, plastic surgery, and surgery.</p>
        <p>Statistical data indicated that the ratio of female to male gender distribution was about 100:116.9 in China [<xref ref-type="bibr" rid="ref52">52</xref>]; however, the ratio of the number of questions raised by female to male users in our collected data was about 229.72 (n=42,136) to 100 (n=18,342), which showed that the young female users were more willing to use OHC for health consultation than were the male users. The results of the chi-square test between gender and departments showed that there were significant differences in health interest areas between different genders (<italic>X</italic><sup>2</sup><sub>1</sub><italic>=</italic>17004.9; <italic>P</italic>&#60;.001). As shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>, the information needs of female users were mainly concentrated on the departments of gynecology and obstetrics, internal medicine, plastic surgery, and dermatology, while those of males were mainly focused on internal medicine, dermatology, andrology, and surgery. It could also be seen that both male and female young people tended to use the OHC to get help about sex-related issues, with females being more concerned about plastic and cosmetic issues and men being more concerned about surgical issues.</p>
        <p>In terms of age distribution, the willingness to access health information from the OHC appeared to increase as age increased. Young adults aged 18 to 25 years were the main group of young users in the OHC, accounting for 87.44% (52,882/60,478) of the total number. The results of the chi-square test between age and departments showed that there were significant differences in the health information need areas of young people at different ages (<italic>X</italic><sup>2</sup><sub>1</sub><italic>=</italic>4437.6; <italic>P</italic>&#60;.001). The department distribution of the needs at different ages is shown in Figure S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. The young adults’ needs were mainly concentrated on gynecology and obstetrics, internal medicine, dermatology, and plastic surgery, which was basically consistent with the overall distribution of needs. The information needs of minors were mainly in the areas of internal medicine, gynecology and obstetrics, dermatology, pediatrics, and preventive health care.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Distribution of Chinese young peoples’ health information needs.</p>
          </caption>
          <graphic xlink:href="medinform_v9i11e30356_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Health information needs distribution of Chinese young people by gender.</p>
          </caption>
          <graphic xlink:href="medinform_v9i11e30356_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>The Results of Topic Analysis</title>
        <p>To further explore the topics of interests of Chinese young people related to health information, we first selected 5 representative diseases, including irregular menstruation, influenza, vitiligo, weight loss, and depression. After applying our 4-step topic extraction strategy, keywords were generated and topics were extracted for each selected disease. The top <italic>N</italic> key words of each cluster ranked by the word importance were selected to characterize the topics. Unless otherwise specified, <italic>N</italic> was set to 10 in this study.</p>
        <p>To better understand the experiment results, a table and word cloud were used to display the topic extraction results. The final topic extraction results of menstrual irregularities and weight loss are presented in <xref ref-type="table" rid="table1">Table 1</xref> and <xref ref-type="table" rid="table2">Table 2</xref>, the topics of vitiligo are presented in Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, while the results of influenza and depression respect are shown in the form of word cloud in Figure S2 and Figure S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, respectively. The keywords here eliminated words such as “vitiligo,” and “ influenza,” and other disease name words, such as well as “how” and “what,” along with other meaningless words.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Topic extraction results for menstrual irregularities.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="100"/>
            <col width="130"/>
            <col width="390"/>
            <col width="380"/>
            <thead>
              <tr valign="top">
                <td>Topic</td>
                <td>Frequency, n (%) (N=1400)</td>
                <td>Concrete content</td>
                <td>Keywords (top 5)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Treatment</td>
                <td>625 (44.64)</td>
                <td>Consult for treatment of menstrual irregularities and medications</td>
                <td>Delay, how to treat, how to do, dysmenorrhea, causes</td>
              </tr>
              <tr valign="top">
                <td>Pathology</td>
                <td>84 (6.00)</td>
                <td>Consult for types, etiology, and pathology of menstrual irregularities</td>
                <td>What is going on, menstruation, bleeding, causes, brown</td>
              </tr>
              <tr valign="top">
                <td>Symptom</td>
                <td>242 (17.29)</td>
                <td>Consult for signs, symptoms, and tests of menstrual irregularities</td>
                <td>Delay, leucorrhea, examination, symptoms, feelings</td>
              </tr>
              <tr valign="top">
                <td>Pregnancy</td>
                <td>189 (13.50)</td>
                <td>Counseling whether menstrual irregularities are associated with pregnancy</td>
                <td>Pregnancy, have sexual intercourse, birth control pills, boyfriend, safety period</td>
              </tr>
              <tr valign="top">
                <td>Diet</td>
                <td>260 (18.57)</td>
                <td>Consult for menstrual irregularities, dietary contraindications and precautions, and suitability of certain foods</td>
                <td>What to eat, food, conditioning, diet, brown sugar</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Topic extraction results for weight loss.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="200"/>
            <col width="0"/>
            <col width="200"/>
            <col width="0"/>
            <col width="300"/>
            <col width="0"/>
            <col width="270"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Topic</td>
                <td colspan="2">Frequency, n (%) (N=3381)</td>
                <td colspan="2">Concrete content</td>
                <td>Keywords (top 5)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Diet</bold>
                </td>
                <td colspan="2">2371 (70.11)</td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Coarse grain</td>
                <td colspan="2">411 (12.16)</td>
                <td colspan="2">Counseling on coarse grain cereals that help lose weight, as well as consumption effects</td>
                <td colspan="2">Potatoes, sweet potatoes, corn, red beans, oats</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Fruits and vegetables</td>
                <td colspan="2">487 (14.40)</td>
                <td colspan="2">Counseling on fruits and vegetables that help you lose weight and how they work</td>
                <td colspan="2">Apples, fruits, bananas, cucumbers, bitter gourd</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Beverages</td>
                <td colspan="2">353 (10.44)</td>
                <td colspan="2">Counseling on various types of beverages that help with weight loss and how well they work</td>
                <td colspan="2">Yogurt, honey water, milk, diet tea, coffee</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Weight loss recipes</td>
                <td colspan="2">1120 (33.13)</td>
                <td colspan="2">Counseling on healthy recipes that help to lose weight</td>
                <td colspan="2">What to eat, how to eat, food, effect, dieting</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Surgery</td>
                <td colspan="2">614 (18.16)</td>
                <td colspan="2">Counseling on various surgical weight loss methods, effects, and costs.</td>
                <td>Diet, treatment, liposuction, thin face pin, surgery, lipolysis, effect</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Pathology</td>
                <td colspan="2">396 (11.71%)</td>
                <td colspan="2">Counseling on the causes of obesity and weight loss methods</td>
                <td> Obesity, getting fat, causing, sweets, why</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>Overall, the topics for all types of diseases were mainly focused on treatment, symptoms, pathology, and diet. For irregular menstruation, influenza, and vitiligo, young people were most concerned about the topic of treatment. Unlike other diseases for which users were mainly concerned about the treatment method, patients with vitiligo were also concerned about the treatment cost and location of treatment. Young people consulting on weight loss were most concerned about the role of diet in weight loss, including the information on how to choose diet recipes and the types of roughage grains, fruits and vegetables, and beverages that help with weight loss. In contrast to other physiological disorders, young people under the depression department were not concerned about the diet topic. They were more interested in symptoms than in treatment. The results of the chi-square test between the disease type and the information needs topic showed that there were significant differences in the topic of information needs between young people with physical and psychological disorders (<italic>X</italic><sup>2</sup><sub>1</sub><italic>=</italic>2591.7; <italic>P</italic>&#60;.001).</p>
        <p>The gender distribution of vitiligo and influenza is shown in Figure S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. The chi-square tests between young people's gender and information need topics in the data of influenza (<italic>X</italic><sup>2</sup><sub>1</sub><italic>=</italic>113.7; <italic>P</italic>&#60;.001), vitiligo (<italic>X</italic><sup>2</sup><sub>1</sub><italic>=</italic>100.6; <italic>P</italic>&#60;.001), weight loss (<italic>X</italic><sup>2</sup><sub>1</sub><italic>=</italic>49.0; <italic>P</italic>&#60;.001), and depression (<italic>X</italic><sup>2</sup><sub>1</sub><italic>=</italic>88.7; <italic>P</italic>&#60;.001) all indicate that there were significant differences in topics of interest in young people of different gender. In all 4 diseases, male young people asked more questions on the treatment topics and pathology topics than did females, and female young people asked more questions on the diet topics than did males.</p>
        <p>In <xref rid="figure5" ref-type="fig">Figure 5</xref>, we used the distribution map and radar chart to show the information needs topic distribution of different ages for menstrual irregularities. The chi-square tests of irregular menstruation (<italic>X</italic><sup>2</sup><sub>1</sub><italic>=</italic>44.4; <italic>P</italic>&#60;.001), influenza (<italic>X</italic><sup>2</sup><sub>1</sub><italic>=</italic>81.1; <italic>P</italic>&#60;.001), vitiligo (<italic>X</italic><sup>2</sup><sub>1</sub><italic>=</italic>64.2; <italic>P</italic>&#60;.001), weight loss (<italic>X</italic><sup>2</sup><sub>1</sub><italic>=</italic>157.5; <italic>P</italic>&#60;.001), and depression (<italic>X</italic><sup>2</sup><sub>1</sub><italic>=</italic>30.2; <italic>P</italic>&#60;.001) indicated that there were significant differences in health information needs of young people of different ages. In all the 5 selected diseases, young adults asked a higher proportion of questions on the topic of diet than did minors, indicating that young adults were more concerned about the topic of diet than were minors.</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>(a) Distribution map of menstrual irregularities topic distribution at different age stages. (b) Radar chart of menstrual irregularities topic distribution at different age stages.</p>
          </caption>
          <graphic xlink:href="medinform_v9i11e30356_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>There are four principal findings in this study. First, Chinese young people's interests on online health information are mainly distributed in the following areas in descending order: gynecology and obstetrics, internal medicine, dermatology, plastic surgery, and surgery. It is worth noting that sexual and reproductive health issues are a concern of both Chinese male and female young people. The development of sexual organs and the awakening of sexual consciousness during adolescence likely lead young people to pay greater attention to health issues related to sexual organs and the reproductive system, including sexual organ development, urinary infection, and menstrual irregularities. However. because of the cultural background and relatively poor sex education level in China, young people are often shy to talk about sexual problems offline, so they hope to receive helpful information online [<xref ref-type="bibr" rid="ref53">53</xref>]. Young people have a high level of oil secretion in their skin, and bad habits and dietary habits are common, which not only affect the health of their skin but also the aesthetics of their appearance, so health information related to skin problems and cosmetic surgery is also urgently sought out by young people.</p>
        <p>Second, most young people in Chinese OHCs are female; this is because there are significant gender differences in the level of health awareness and attention to health information among young people in social media [<xref ref-type="bibr" rid="ref54">54</xref>], with females having a higher level of health awareness and attention to health information than males. Moreover, gender is an important factor affecting the need for health-related information for Chinese young people. Male young people are more concerned about treatment and pathology topics than are females, and female young people are more concerned about diet topics than are males. This is the same conclusion as that found by previous studies [<xref ref-type="bibr" rid="ref55">55</xref>], where male young people were significantly lower than females both in terms of their level of dietary health and awareness of a healthy diet.</p>
        <p>Third, young adults aged 18 to 25 year are the main group of young users in OHCs. This is because the number of young adults using the internet and OHCs is much larger than that of minors aged 10 to 17 years. As a group that has initially left the family and entered society, young adults lack parental care and help in health issues and are more willing to seek help in OHCs. There are also significant age differences in young people's health information needs in OHCs. Compared with young adults, the interest in gynecology and obstetrics is lower while the interest in pediatrics is higher among minors, and this difference is mainly determined by the developmental stage. Furthermore, young adults are more concerned with the topic of diet than are minors. This is because primary and secondary schools in China do not currently provided adequate dietary health education [<xref ref-type="bibr" rid="ref56">56</xref>], but as young people grow older, the channels for dietary health education expand, their knowledge of dietary health increases, and their awareness of the importance of healthy eating rises.</p>
        <p>Finally, for Chinese young people, the information needs mainly focus on treatment, symptoms, etiology, pathology, and diet, whereas less attention is paid to the topic of prevention. Meanwhile, there are significant differences for different disease types. For physiological diseases, such as irregular menstruation, influenza, and vitiligo, young people pay most attention in OHCs to the treatment to understand the treatment methods, costs, and hospital-related information. For mental diseases, such as depression, they are most concerned about the topic of symptoms, hoping the OHC can help them to judge whether they have the condition or not. This is because young people lack knowledge about psychological health and have difficulty in self-judging mental illness, so more young people are eager to seek help from doctors by describing their symptoms in OHCs to determine whether they have a psychological illness [<xref ref-type="bibr" rid="ref57">57</xref>].</p>
      </sec>
      <sec>
        <title>Theoretical Implications</title>
        <p>Based on real user-generated content, this study applied a web crawler, NLP, and statistical analysis technologies to comprehensively analyze Chinese youth's online information needs. This study attempted to reduce the deficiencies of the related literature, whose limitations included small research samples and relatively simple data analysis methods.</p>
        <p>To deal with the challenge of mining topics from a massive collection of sparse short text from the internet, we used a general 4-step topic mining strategy. Using an advanced pretraining model, SBERT, and PCA dimension reduction, we generated high-quality clusters for extracting the topic of health information needs. From a technical point of view, this scheme provides a good method of topic analysis for short texts collected from the internet. Furthermore, with minor changes, such as removing word segmentation in the data preprocessing step, it can be extended to apply to other similar tasks using English-language data from websites.</p>
        <p>Our study also found that there were significant differences between Chinese and other countries' youth in the distribution and topics of online health information needs, which may have important implications for other researchers by providing data support and a basis for further research on differentiation.</p>
      </sec>
      <sec>
        <title>Practical Implications</title>
        <p>Many practical implications could be derived from this study. First, the education of disease prevention for young people should be strengthened. The topic mining results of various diseases showed that youth pay the least attention to the topic of disease prevention, which indicates that schools, families, and internet health and service platforms including OHCs should pay more attention to the education and guidance of disease prevention for youth.</p>
        <p>As mentioned earlier, sexual and reproductive health were one of the most concerning fields for Chinese young people. Therefore, it is necessary to improve network management to guide youth in treating and understanding sex-related information on the internet. An effective way is to establish professional and authoritative sexual health–related knowledge platforms to provide scientific information to young people at different stages of development.</p>
        <p>Moreover, the information service mode of OHCs requires innovation. At present, most of the information service models of Chinese OHCs are centered on the aggregation and organization of health information resources, which ignores the needs of users to some extent and is challenged in providing accurate service. Therefore, databases on user's health information needs should be established based on the results from mining and analysis of their actual interests. Based on the OHCs’ service platform, information matching and precision service of the information resources and information needs databases should be realized, which will provide personalized information and health services for youth and other users.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>This study has some limitations. First, the experimental data were collected from only a single website, and thus the data source setting was substantially limited. In future studies, we plan to collect a larger data set from different OHCs to ensure the research results are more comprehensive and reliable. Second, although the presented framework showed good results in topic mining tasks for short texts from the internet, there is still much room for improvement related to the clustering tasks in specialized domains, and our future work will integrate expertise in specific domains into the model to improve its performance.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In this study, we conducted statistical analysis and topic analysis of online health information to explore the distribution, impact factors, and topics of interests of Chinese young people. A general topic analysis strategy using the pretraining model SBERT was proposed to extract high-quality topics based on large-scale sparse short texts from the internet. The research findings are helpful for health education departments to understand the real health-related needs of young people, carry out targeted education, and improve young people’s health literacy, and may be useful for OHCs to innovate and improve information service.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Related work.</p>
        <media xlink:href="medinform_v9i11e30356_app1.docx" xlink:title="DOCX File , 878 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">OHC</term>
          <def>
            <p>online health community</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">PCA</term>
          <def>
            <p>principal component analysis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">TF-IDF</term>
          <def>
            <p>term frequency–inverse document frequency</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">SBERT</term>
          <def>
            <p>sentence-BERT</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">WHO</term>
          <def>
            <p>World Health Organization</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was funded by the Beijing Natural Science Foundation(#1202020) and the Open Foundation of State Key Laboratory of Networking and Switching Technology (#SKLNST-2020-1-19). The funding body was not involved in the study design, data collection, data analysis, or writing of the manuscript.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>All authors were involved in the design of the study. JW led the drafting of the manuscript with assistance from XW, LW, and YP. LW implemented and tested the software used to collect data and perform the analyses. XW and YP supervised the project and revised the manuscript for important intellectual content. All authors read and agreed with the analysis and the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yuelin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wenjuan</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>A review of the studies on health information seeking behavior overseas</article-title>
          <source>Library and Information Service</source>
          <year>2012</year>
          <volume>19</volume>
          <fpage>128</fpage>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Information needs of domestic and international hcqa users an empirical analysis</article-title>
          <source>Data Analysis and Knowledge Discovery</source>
          <year>2019</year>
          <volume>3</volume>
          <issue>5</issue>
          <fpage>2019</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.11925/infotech.2096-3467.2018.0813</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rowlands</surname>
              <given-names>IJ</given-names>
            </name>
            <name name-style="western">
              <surname>Loxton</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Dobson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>GD</given-names>
            </name>
          </person-group>
          <article-title>Seeking health information online: association with young Australian women's physical, mental, and reproductive health</article-title>
          <source>J Med Internet Res</source>
          <year>2015</year>
          <month>05</month>
          <day>18</day>
          <volume>17</volume>
          <issue>5</issue>
          <fpage>e120</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2015/5/e120/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.4048</pub-id>
          <pub-id pub-id-type="medline">25986630</pub-id>
          <pub-id pub-id-type="pii">v17i5e120</pub-id>
          <pub-id pub-id-type="pmcid">PMC4468597</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>China Association for Science and Technology</collab>
          </person-group>
          <source>The search behavior report on popular science needs of Chinese citizens in 2018</source>
          <access-date>2021-07-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.kepuchina.cn/more/201904/t20190416_1041674.shtml">http://www.kepuchina.cn/more/201904/t20190416_1041674.shtml</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnston</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Worrell</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Di Gangi</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Wasko</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Online health communities: an assessment of the influence of participation on patient empowerment outcomes</article-title>
          <source>Info Technology &#38; People</source>
          <year>2013</year>
          <month>05</month>
          <day>31</day>
          <volume>26</volume>
          <issue>2</issue>
          <fpage>213</fpage>
          <lpage>235</lpage>
          <pub-id pub-id-type="doi">10.1108/ITP-02-2013-0040</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Conway</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>WW</given-names>
            </name>
          </person-group>
          <article-title>Recent advances in using natural language processing to address public health research questions using social media and consumer generated data</article-title>
          <source>Yearb Med Inform</source>
          <year>2019</year>
          <month>08</month>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>208</fpage>
          <lpage>217</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.thieme-connect.com/DOI/DOI?10.1055/s-0039-1677918"/>
          </comment>
          <pub-id pub-id-type="doi">10.1055/s-0039-1677918</pub-id>
          <pub-id pub-id-type="medline">31419834</pub-id>
          <pub-id pub-id-type="pmcid">PMC6697505</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Study on differences between patients with physiological and psychological diseases in online health communities: topic analysis and sentiment analysis</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2020</year>
          <month>02</month>
          <day>26</day>
          <volume>17</volume>
          <issue>5</issue>
          <fpage>1508</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph17051508"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph17051508</pub-id>
          <pub-id pub-id-type="medline">32111045</pub-id>
          <pub-id pub-id-type="pii">ijerph17051508</pub-id>
          <pub-id pub-id-type="pmcid">PMC7084206</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McKinnon</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>H Y Caldwell</surname>
              <given-names>Patrina</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>KM</given-names>
            </name>
          </person-group>
          <article-title>How adolescent patients search for and appraise online health information: A pilot study</article-title>
          <source>J Paediatr Child Health</source>
          <year>2020</year>
          <month>08</month>
          <volume>56</volume>
          <issue>8</issue>
          <fpage>1270</fpage>
          <lpage>1276</lpage>
          <pub-id pub-id-type="doi">10.1111/jpc.14918</pub-id>
          <pub-id pub-id-type="medline">32479676</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="web">
          <article-title>Orientation programme on adolescent health for health care providers</article-title>
          <source>World Health Organization</source>
          <access-date>2021-07-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://extranet.who.int/iris/restricted/handle/10665/42868">https://extranet.who.int/iris/restricted/handle/10665/42868</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kwon</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Health-related internet use by children and adolescents: systematic review</article-title>
          <source>J Med Internet Res</source>
          <year>2018</year>
          <month>04</month>
          <day>03</day>
          <volume>20</volume>
          <issue>4</issue>
          <fpage>e120</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2018/4/e120/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.7731</pub-id>
          <pub-id pub-id-type="medline">29615385</pub-id>
          <pub-id pub-id-type="pii">v20i4e120</pub-id>
          <pub-id pub-id-type="pmcid">PMC5904452</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>SU</given-names>
            </name>
            <name name-style="western">
              <surname>Martinović</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Katavić</surname>
              <given-names>SS</given-names>
            </name>
          </person-group>
          <article-title>The use of mobile devices and applications for health information: A survey of Croatian students</article-title>
          <source>Journal of Librarianship and Information Science</source>
          <year>2019</year>
          <month>10</month>
          <day>22</day>
          <volume>52</volume>
          <issue>3</issue>
          <fpage>880</fpage>
          <lpage>894</lpage>
          <pub-id pub-id-type="doi">10.1177/0961000619880937</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hassan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Masoud</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Online health information seeking and health literacy among non-medical college students: gender differences</article-title>
          <source>J Public Health (Berl.)</source>
          <year>2020</year>
          <month>03</month>
          <day>09</day>
          <fpage>1</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1007/s10389-020-01243-w</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gaskin</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Anoshiravani</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Internet access and attitudes toward online personal health information among detained youth</article-title>
          <source>Journal of Adolescent Health</source>
          <year>2012</year>
          <month>2</month>
          <volume>50</volume>
          <issue>2</issue>
          <fpage>S91</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jadohealth.2011.10.239</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wartella</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rideout</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Montague</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Beaudoin-Ryan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lauricella</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Teens, health and technology: a national survey</article-title>
          <source>MaC</source>
          <year>2016</year>
          <month>06</month>
          <day>16</day>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>13</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.17645/mac.v4i3.515</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>SP</given-names>
            </name>
            <name name-style="western">
              <surname>Hilton</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Flowers</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>McDaid</surname>
              <given-names>LM</given-names>
            </name>
          </person-group>
          <article-title>What are the barriers and challenges faced by adolescents when searching for sexual health information on the internet? Implications for policy and practice from a qualitative study</article-title>
          <source>Sex Transm Infect</source>
          <year>2019</year>
          <month>09</month>
          <volume>95</volume>
          <issue>6</issue>
          <fpage>462</fpage>
          <lpage>467</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31040251"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/sextrans-2018-053710</pub-id>
          <pub-id pub-id-type="medline">31040251</pub-id>
          <pub-id pub-id-type="pii">sextrans-2018-053710</pub-id>
          <pub-id pub-id-type="pmcid">PMC6706277</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>NG</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>MI</given-names>
            </name>
            <name name-style="western">
              <surname>Lafferty</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Latent Dirichlet allocation</article-title>
          <source>Journal of Machine Learning Research</source>
          <year>2003</year>
          <volume>1</volume>
          <fpage>993</fpage>
          <lpage>1022</lpage>
          <pub-id pub-id-type="doi">10.1162/jmlr.2003.3.4-5.993</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Deerwester</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dumais</surname>
              <given-names>ST</given-names>
            </name>
            <name name-style="western">
              <surname>Furnas</surname>
              <given-names>GW</given-names>
            </name>
            <name name-style="western">
              <surname>Landauer</surname>
              <given-names>TK</given-names>
            </name>
            <name name-style="western">
              <surname>Harshman</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Indexing by latent semantic analysis</article-title>
          <source>J. Am. Soc. Inf. Sci</source>
          <year>1990</year>
          <month>09</month>
          <volume>41</volume>
          <issue>6</issue>
          <fpage>391</fpage>
          <lpage>407</lpage>
          <pub-id pub-id-type="doi">10.1002/(sici)1097-4571(199009)41:6&#60;391::aid-asi1&#62;3.0.co;2-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Davison</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Empirical study of topic modeling in Twitter</article-title>
          <year>2010</year>
          <month>7</month>
          <day>25</day>
          <conf-name>The 16th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
          <conf-date>July 25-28, 2010</conf-date>
          <conf-loc>Washington DC, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/1964858.1964870</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rashid</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>SMA</given-names>
            </name>
            <name name-style="western">
              <surname>Irtaza</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Fuzzy topic modeling approach for text mining over short text</article-title>
          <source>Information Processing &#38; Management</source>
          <year>2019</year>
          <month>11</month>
          <volume>56</volume>
          <issue>6</issue>
          <fpage>102060</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ipm.2019.102060</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Efficient estimation of word representations in vector space</article-title>
          <source>arXiv preprint</source>
          <year>2013</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://export.arxiv.org/pdf/1301.3781"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goldberg</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>word2vec Explained: deriving Mikolov et al.'s negative-sampling word-embedding method</article-title>
          <source>arXiv preprint</source>
          <year>2014</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1402.3722.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McMullan</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Berle</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Arnáez</surname>
              <given-names>Sandra</given-names>
            </name>
            <name name-style="western">
              <surname>Starcevic</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>The relationships between health anxiety, online health information seeking, and cyberchondria: Systematic review and meta-analysis</article-title>
          <source>J Affect Disord</source>
          <year>2019</year>
          <month>02</month>
          <day>15</day>
          <volume>245</volume>
          <fpage>270</fpage>
          <lpage>278</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jad.2018.11.037</pub-id>
          <pub-id pub-id-type="medline">30419526</pub-id>
          <pub-id pub-id-type="pii">S0165-0327(18)31577-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alghamdi</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Alqarni</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Bakarman</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Moniem Mukhtar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bakarman</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Use of internet health information among students in Jeddah, Saudi Arabia: a cross-sectional study</article-title>
          <source>GJHS</source>
          <year>2019</year>
          <month>04</month>
          <day>03</day>
          <volume>11</volume>
          <issue>5</issue>
          <fpage>51</fpage>
          <pub-id pub-id-type="doi">10.5539/gjhs.v11n5p51</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fergie</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hunt</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hilton</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>What young people want from health-related online resources: a focus group study</article-title>
          <source>J Youth Stud</source>
          <year>2013</year>
          <month>08</month>
          <volume>16</volume>
          <issue>5</issue>
          <fpage>579</fpage>
          <lpage>596</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24748849"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/13676261.2012.744811</pub-id>
          <pub-id pub-id-type="medline">24748849</pub-id>
          <pub-id pub-id-type="pmcid">PMC3982905</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Song</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Seo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>JH</given-names>
            </name>
          </person-group>
          <article-title>ata mining Data mining of web-based documents on social networking sites that included suicide-related words among Korean adolescents</article-title>
          <source>J Adolesc Health</source>
          <year>2016</year>
          <month>12</month>
          <volume>59</volume>
          <issue>6</issue>
          <fpage>668</fpage>
          <lpage>673</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jadohealth.2016.07.025</pub-id>
          <pub-id pub-id-type="medline">27693129</pub-id>
          <pub-id pub-id-type="pii">S1054-139X(16)30246-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prabha</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Sarojini</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Online healthcare information adoption assessment using text mining techniques</article-title>
          <source>Mobile Netw Appl</source>
          <year>2019</year>
          <month>4</month>
          <day>19</day>
          <volume>24</volume>
          <issue>4</issue>
          <fpage>1160</fpage>
          <lpage>1165</lpage>
          <pub-id pub-id-type="doi">10.1007/s11036-019-01253-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Cancer information seeking in social question and answer services: identifying health-related topics in cancer questions on Yahoo! Answers</article-title>
          <source>Information Research-an International Electronic Journal</source>
          <year>2016</year>
          <month>9</month>
          <volume>21</volume>
          <issue>3</issue>
          <fpage>718</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://informationr.net/ir/21-3/paper718.html#.YWlbaLhByji"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Xin</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Xiaoqing</given-names>
            </name>
            <name name-style="western">
              <surname>Ouyang</surname>
              <given-names>Wei</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Chao</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Fei</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Yang</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>Haiyan</given-names>
            </name>
          </person-group>
          <article-title>Multidimensional feature classification of the health information needs of patients with Hypertension in an online health community through analysis of 1000 patient question records: observational study</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>05</month>
          <day>29</day>
          <volume>22</volume>
          <issue>5</issue>
          <fpage>e17349</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/5/e17349/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/17349</pub-id>
          <pub-id pub-id-type="medline">32469318</pub-id>
          <pub-id pub-id-type="pii">v22i5e17349</pub-id>
          <pub-id pub-id-type="pmcid">PMC7293056</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Henderson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Keogh</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rosser</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Eccleston</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Searching the internet for help with pain: adolescent search, coping, and medication behaviour</article-title>
          <source>Br J Health Psychol</source>
          <year>2013</year>
          <month>02</month>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>218</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.1111/bjhp.12005</pub-id>
          <pub-id pub-id-type="medline">23126577</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Manganello</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Sojka</surname>
              <given-names>CJ</given-names>
            </name>
          </person-group>
          <article-title>An exploratory study of health literacy and African American adolescents</article-title>
          <source>Comprehensive Child and Adolescent Nursing</source>
          <year>2016</year>
          <month>07</month>
          <day>20</day>
          <volume>39</volume>
          <issue>3</issue>
          <fpage>221</fpage>
          <lpage>239</lpage>
          <pub-id pub-id-type="doi">10.1080/24694193.2016.1196264</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wetterlin</surname>
              <given-names>FM</given-names>
            </name>
            <name name-style="western">
              <surname>Mar</surname>
              <given-names>MY</given-names>
            </name>
            <name name-style="western">
              <surname>Neilson</surname>
              <given-names>EK</given-names>
            </name>
            <name name-style="western">
              <surname>Werker</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Krausz</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>eMental health experiences and expectations: a survey of youths' Web-based resource preferences in Canada</article-title>
          <source>J Med Internet Res</source>
          <year>2014</year>
          <month>12</month>
          <day>17</day>
          <volume>16</volume>
          <issue>12</issue>
          <fpage>e293</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2014/12/e293/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.3526</pub-id>
          <pub-id pub-id-type="medline">25519847</pub-id>
          <pub-id pub-id-type="pii">v16i12e293</pub-id>
          <pub-id pub-id-type="pmcid">PMC4275486</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Theriault</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Seeking mental health information and support online: experiences and perspectives of young people receiving treatment for first-episode psychosis</article-title>
          <source>Early Interv Psychiatry</source>
          <year>2018</year>
          <month>06</month>
          <day>26</day>
          <volume>12</volume>
          <issue>3</issue>
          <fpage>324</fpage>
          <lpage>330</lpage>
          <pub-id pub-id-type="doi">10.1111/eip.12317</pub-id>
          <pub-id pub-id-type="medline">26810026</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pretorius</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chambers</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Coyle</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Young people's online help-seeking and mental health difficulties: systematic narrative review</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>11</month>
          <day>19</day>
          <volume>21</volume>
          <issue>11</issue>
          <fpage>e13873</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/11/e13873/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13873</pub-id>
          <pub-id pub-id-type="medline">31742562</pub-id>
          <pub-id pub-id-type="pii">v21i11e13873</pub-id>
          <pub-id pub-id-type="pmcid">PMC6891826</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Buhi</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Daley</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Fuhrmann</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>An observational study of how young people search for online sexual health information</article-title>
          <source>J Am Coll Health</source>
          <year>2009</year>
          <month>09</month>
          <volume>58</volume>
          <issue>2</issue>
          <fpage>101</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.1080/07448480903221236</pub-id>
          <pub-id pub-id-type="medline">19892646</pub-id>
          <pub-id pub-id-type="pii">Y826186835U6HX25</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Magee</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Bigelow</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dehaan</surname>
              <given-names>Samantha</given-names>
            </name>
            <name name-style="western">
              <surname>Mustanski</surname>
              <given-names>BS</given-names>
            </name>
          </person-group>
          <article-title>Sexual health information seeking online: a mixed-methods study among lesbian, gay, bisexual, and transgender young people</article-title>
          <source>Health Educ Behav</source>
          <year>2012</year>
          <month>06</month>
          <day>13</day>
          <volume>39</volume>
          <issue>3</issue>
          <fpage>276</fpage>
          <lpage>89</lpage>
          <pub-id pub-id-type="doi">10.1177/1090198111401384</pub-id>
          <pub-id pub-id-type="medline">21490310</pub-id>
          <pub-id pub-id-type="pii">1090198111401384</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Young People'S Sexual Health Literacy: Seeking, Understanding, and Evaluating Online Sexual Health Information</article-title>
          <source>University of Glasgow</source>
          <year>2017</year>
          <access-date>2021-07-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://theses.gla.ac.uk/8528/">https://theses.gla.ac.uk/8528/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fergie</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hilton</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hunt</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Young adults' experiences of seeking online information about diabetes and mental health in the age of social media</article-title>
          <source>Health Expect</source>
          <year>2016</year>
          <month>12</month>
          <day>08</day>
          <volume>19</volume>
          <issue>6</issue>
          <fpage>1324</fpage>
          <lpage>1335</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1111/hex.12430"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/hex.12430</pub-id>
          <pub-id pub-id-type="medline">26647109</pub-id>
          <pub-id pub-id-type="pmcid">PMC5139057</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Duduciuc</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>Online health information seeking during adolescence: a quantitative study regarding Romanian teenagers</article-title>
          <source>SCECO. Economic Edition</source>
          <year>2015</year>
          <month>12</month>
          <day>29</day>
          <issue>22</issue>
          <fpage>89</fpage>
          <lpage>95</lpage>
          <pub-id pub-id-type="doi">10.29358/sceco.v0i22.329</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Montagni</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Cariou</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Feuillet</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Langlois</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Tzourio</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Exploring digital health use and opinions of university students: field survey study</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2018</year>
          <month>03</month>
          <day>15</day>
          <volume>6</volume>
          <issue>3</issue>
          <fpage>e65</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mhealth.jmir.org/2018/3/e65/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/mhealth.9131</pub-id>
          <pub-id pub-id-type="medline">29549071</pub-id>
          <pub-id pub-id-type="pii">v6i3e65</pub-id>
          <pub-id pub-id-type="pmcid">PMC5876492</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yen</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Disease risk and its moderating effect on the e-consultation market offline and online signals</article-title>
          <source>ITP</source>
          <year>2019</year>
          <month>08</month>
          <day>05</day>
          <volume>32</volume>
          <issue>4</issue>
          <fpage>1065</fpage>
          <lpage>1084</lpage>
          <pub-id pub-id-type="doi">10.1108/itp-03-2018-0127</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="web">
          <article-title>Chinese medical subject headings</article-title>
          <source>Institute of Medical Information, Chinese Academy of Medical Sciences</source>
          <access-date>2021-07-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://cmesh.imicams.ac.cn/index.action?action=index&#38;noMsg=1">http://cmesh.imicams.ac.cn/index.action?action=index&#38;noMsg=1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abdi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shamsuddin</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Hasan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Piran</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Deep learning-based sentiment classification of evaluative text based on Multi-feature fusion</article-title>
          <source>Information Processing &#38; Management</source>
          <year>2019</year>
          <volume>56</volume>
          <issue>4</issue>
          <fpage>1245</fpage>
          <lpage>1259</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ipm.2019.02.018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Bert: Pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>arXiv preprint</source>
          <year>2018</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1810.04805.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reimers</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Gurevych</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Sentence-BERT: Sentence embeddings using Siamese BERT-networks</article-title>
          <year>2019</year>
          <conf-name>Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing</conf-name>
          <conf-date>November 03- 07，2019</conf-date>
          <conf-loc>Hong Kong, China</conf-loc>
          <fpage>1908.10084</fpage>
          <pub-id pub-id-type="doi">10.18653/v1/D19-1410</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jie</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lianyu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Clustering algorithms research</article-title>
          <source>Journal of Software</source>
          <year>2008</year>
          <month>06</month>
          <day>30</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>48</fpage>
          <lpage>61</lpage>
          <pub-id pub-id-type="doi">10.3724/sp.j.1001.2008.00048</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rousseeuw</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>Silhouettes: A graphical aid to the interpretation and validation of cluster analysis</article-title>
          <source>Journal of Computational and Applied Mathematics</source>
          <year>1987</year>
          <month>11</month>
          <volume>20</volume>
          <fpage>53</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.1016/0377-0427(87)90125-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yoshida</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Text clustering using frequent itemsets</article-title>
          <source>Knowledge-Based Systems</source>
          <year>2010</year>
          <month>7</month>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>379</fpage>
          <lpage>388</lpage>
          <pub-id pub-id-type="doi">10.1016/j.knosys.2010.01.011</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Salton</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Buckley</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Term-weighting approaches in automatic text retrieval</article-title>
          <source>Information Processing &#38; Management</source>
          <year>1988</year>
          <month>1</month>
          <volume>24</volume>
          <issue>5</issue>
          <fpage>513</fpage>
          <lpage>523</lpage>
          <pub-id pub-id-type="doi">10.1016/0306-4573(88)90021-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vinh</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Epps</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bailey</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Information theoretic measures for clusterings comparison: Variants, properties, normalization and correction for chance</article-title>
          <source>The Journal of Machine Learning Research</source>
          <year>2010</year>
          <volume>11</volume>
          <fpage>2837</fpage>
          <lpage>2854</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmlr.org/papers/volume11/vinh10a/vinh10a.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rojas</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Santos</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Mora</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>New version of davies-bouldin index for clustering validation based on cylindrical distance</article-title>
          <year>2013</year>
          <conf-name>32nd International Conference of the Chilean Computer Science Society (SCCC)</conf-name>
          <conf-date>Nov 11-15, 2013</conf-date>
          <conf-loc>Temuco, Chile</conf-loc>
          <fpage>49</fpage>
          <lpage>53</lpage>
          <pub-id pub-id-type="doi">10.1109/sccc.2013.29</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Epps</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bailey</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Information theoretic measures for clusterings comparison: is a correction for chance necessary?</article-title>
          <year>2009</year>
          <conf-name>ICML '09: Proceedings of the 26th Annual International Conference on Machine Learning</conf-name>
          <conf-date>June 14-18, 2009</conf-date>
          <conf-loc>Montreal, QC, Canada</conf-loc>
          <fpage>1073</fpage>
          <lpage>1080</lpage>
          <pub-id pub-id-type="doi">10.1145/1553374.1553511</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="web">
          <article-title>The 45th China Statistical Report on Internet Development</article-title>
          <source>China Internet Network Information Center</source>
          <access-date>2021-07-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.cnnic.net.cn/hlwfzyj/hlwxzbg/hlwtjbg/202004/P020200428596599037028.pdf">http://www.cnnic.net.cn/hlwfzyj/hlwxzbg/hlwtjbg/202004/P020200428596599037028.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>, Chang, C</article-title>
          <source>The possibility of online education applying in sex education among adolescents. Chinese Journal of Health Education</source>
          <year>2019</year>
          <volume>35</volume>
          <issue>08</issue>
          <fpage>739</fpage>
          <lpage>743</lpage>
          <pub-id pub-id-type="doi">10.16168/j.cnki.issn.1002-9982.2019.08.014</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Research on the Influence of Social Media Health Information Attention on College Students’ Health Behavior and Cognition</article-title>
          <source>CNKI</source>
          <year>2017</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://cdmd.cnki.com.cn/Article/CDMD-10475-1017231135.htm">http://cdmd.cnki.com.cn/Article/CDMD-10475-1017231135.htm</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>An investigation report on the dietary health of College Students</article-title>
          <source>Journal of Hebei Institute of Socialism</source>
          <year>2009</year>
          <volume>02</volume>
          <fpage>93</fpage>
          <lpage>96</lpage>
          <pub-id pub-id-type="doi">10.3969/j.issn.1009-6981.2009.02.034</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huan</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Absence and make up of nutrition policy in youth health promotion</article-title>
          <source>Journal of Hebei Institute of Socialism</source>
          <year>2018</year>
          <volume>24</volume>
          <fpage>5</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.3969/j.issn.1006-9577.2018.03.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Correlative research among adolescents' health literacy, psychological behavioral problems, and help-seeking attitude and willingness</article-title>
          <source>Chinese Nursing Research</source>
          <year>2017</year>
          <volume>31</volume>
          <issue>16</issue>
          <fpage>1951</fpage>
          <lpage>1955</lpage>
          <pub-id pub-id-type="doi">10.3969/j.issn.1009-6493.2017.16.010</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
