<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i4e17642</article-id>
      <article-id pub-id-type="pmid">32324148</article-id>
      <article-id pub-id-type="doi">10.2196/17642</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Using Natural Language Processing Techniques to Provide Personalized Educational Materials for Chronic Disease Patients in China: Development and Assessment of a Knowledge-Based Health Recommender System</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Lu</surname>
            <given-names>Xudong</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Dery</surname>
            <given-names>Julien</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Wiesner</surname>
            <given-names>Martin</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Schnell</surname>
            <given-names>Michael</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Ndabu</surname>
            <given-names>Theophile</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Zheyu</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3879-1501</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>Haoce</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4468-3152</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Cui</surname>
            <given-names>Liping</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3640-3007</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Juan</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5801-9124</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>An</surname>
            <given-names>Jiye</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6149-7052</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Duan</surname>
            <given-names>Huilong</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3893-213X</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Ge</surname>
            <given-names>Huiqing</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5822-2998</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Deng</surname>
            <given-names>Ning</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Ministry of Education Key Laboratory of Biomedical Engineering</institution>
            <institution>College of Biomedical Engineering and Instrument Science</institution>
            <institution>Zhejiang University</institution>
            <addr-line>38 Zheda Rd, Zhouyiqing Bldg 512</addr-line>
            <addr-line>Yuquan Campus</addr-line>
            <addr-line>Hangzhou</addr-line>
            <country>China</country>
            <phone>86 571 2295 2693</phone>
            <email>zju.dengning@gmail.com</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6573-1061</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Ministry of Education Key Laboratory of Biomedical Engineering</institution>
        <institution>College of Biomedical Engineering and Instrument Science</institution>
        <institution>Zhejiang University</institution>
        <addr-line>Hangzhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Engineering Research Center of Cognitive Healthcare of Zhejiang Province (Sir Run Run Shaw Hospital)</institution>
        <institution>Zhejiang University</institution>
        <addr-line>Hangzhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>General Hospital of Ningxia Medical University</institution>
        <addr-line>Yinchuan</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Sir Run-Run Shaw Hospital</institution>
        <institution>Zhejiang University School of Medicine</institution>
        <institution>Zhejiang University</institution>
        <addr-line>Hangzhou</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Ning Deng <email>zju.dengning@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>4</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>23</day>
        <month>4</month>
        <year>2020</year>
      </pub-date>
      <volume>8</volume>
      <issue>4</issue>
      <elocation-id>e17642</elocation-id>
      <history>
        <date date-type="received">
          <day>30</day>
          <month>12</month>
          <year>2019</year>
        </date>
        <date date-type="rev-request">
          <day>27</day>
          <month>1</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>20</day>
          <month>3</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>3</day>
          <month>4</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Zheyu Wang, Haoce Huang, Liping Cui, Juan Chen, Jiye An, Huilong Duan, Huiqing Ge, Ning Deng. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 23.04.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://medinform.jmir.org/2020/4/e17642/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Health education emerged as an important intervention for improving the awareness and self-management abilities of chronic disease patients. The development of information technologies has changed the form of patient educational materials from traditional paper materials to electronic materials. To date, the amount of patient educational materials on the internet is tremendous, with variable quality, which makes it hard to identify the most valuable materials by individuals lacking medical backgrounds.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to develop a health recommender system to provide appropriate educational materials for chronic disease patients in China and evaluate the effect of this system.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>A knowledge-based recommender system was implemented using ontology and several natural language processing (NLP) techniques. The development process was divided into 3 stages. In stage 1, an ontology was constructed to describe patient characteristics contained in the data. In stage 2, an algorithm was designed and implemented to generate recommendations based on the ontology. Patient data and educational materials were mapped to the ontology and converted into vectors of the same length, and then recommendations were generated according to similarity between these vectors. In stage 3, the ontology and algorithm were incorporated into an mHealth system for practical use. Keyword extraction algorithms and pretrained word embeddings were used to preprocess educational materials. Three strategies were proposed to improve the performance of keyword extraction. System evaluation was based on a manually assembled test collection for 50 patients and 100 educational documents. Recommendation performance was assessed using the macro precision of top-ranked documents and the overall mean average precision (MAP).</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The constructed ontology contained 40 classes, 31 object properties, 67 data properties, and 32 individuals. A total of 80 SWRL rules were defined to implement the semantic logic of mapping patient original data to the ontology vector space. The recommender system was implemented as a separate Web service connected with patients' smartphones. According to the evaluation results, our system can achieve a macro precision up to 0.970 for the top 1 recommendation and an overall MAP score up to 0.628.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study demonstrated that a knowledge-based health recommender system has the potential to accurately recommend educational materials to chronic disease patients. Traditional NLP techniques combined with improvement strategies for specific language and domain proved to be effective for improving system performance. One direction for future work is to explore the effect of such systems from the perspective of patients in a practical setting.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>health education</kwd>
        <kwd>ontology</kwd>
        <kwd>natural language processing</kwd>
        <kwd>chronic disease</kwd>
        <kwd>recommender system</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Chronic (or noncommunicable) diseases are the most prevalent and costly conditions worldwide [<xref ref-type="bibr" rid="ref1">1</xref>]. To improve the survival rate and life quality of chronic disease patients, long-term self-management and supervision and intervention from doctors are essential [<xref ref-type="bibr" rid="ref2">2</xref>]. However, in practice, some patients don’t perform effective self-management regimes due to the lack of necessary knowledge, skills, and confidence, which results in decreased treatment effectiveness or even treatment failure [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref6">6</xref>]. Health education from health care providers has been considered an important intervention for improving patient awareness and self-management abilities in chronic disease management [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>].</p>
        <p>The development of information technologies has promoted the advent of eHealth-enhanced chronic disease management, which changed the form of patient educational materials from traditional paper materials to electronic materials [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref13">13</xref>]. Patients can either receive expert-vetted materials from their doctors or perform self-learning on the internet. To date, a large amount of patient educational materials exist on the internet; however, the quality of health information in these materials is highly variable [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref17">17</xref>]. Patients without a medical background may find it hard to identify the most relevant and valuable materials for themselves [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. A system that is capable of automatically identifying and recommending appropriate materials to patients based on their needs [<xref ref-type="bibr" rid="ref20">20</xref>] or preferences [<xref ref-type="bibr" rid="ref21">21</xref>] would be applicable to solve the above problems. Such a system can be categorized as a kind of health recommender system (HRS).</p>
        <p>As one of the specializations of recommender systems, an HRS aims to recommend relevant medical information to health professionals or patients [<xref ref-type="bibr" rid="ref22">22</xref>]. A number of works regarding the design and implementation of HRSs have been published, providing recommendations in different areas such as diets [<xref ref-type="bibr" rid="ref23">23</xref>], health care services [<xref ref-type="bibr" rid="ref24">24</xref>], educational materials [<xref ref-type="bibr" rid="ref25">25</xref>], and decision-making advice for doctors [<xref ref-type="bibr" rid="ref26">26</xref>]. Pincay et al [<xref ref-type="bibr" rid="ref27">27</xref>] summarized HRSs into 4 recommendation areas: wellness, diagnosis and medication, health care services, and medical resources. Among these areas, patient educational materials belong to the medical resources. Given the fact that only 3% of the articles focused on this area [<xref ref-type="bibr" rid="ref27">27</xref>], in this study we aimed to develop an HRS to provide personalized educational materials for patients with chronic diseases.</p>
      </sec>
      <sec>
        <title>Related Work</title>
        <p>In a health context, multiple methods from the computer science field have been applied to compute relevant recommendations. According to a review [<xref ref-type="bibr" rid="ref22">22</xref>], two main approaches were used for HRSs. One is the information retrieval (IR) approach, in which the recommendations are generated based on a query that describes the user’s information interest. Another approach is the recommendation algorithm (RA) approach, which has been widely used in the context of online shopping and advertisement [<xref ref-type="bibr" rid="ref28">28</xref>]. Unlike the IR approach that returns relevant results matching the user query, the RA approach generates personalized results tailored to the users’ potential needs or preferences.</p>
        <p>Among different RA approaches [<xref ref-type="bibr" rid="ref29">29</xref>], the most applied methods in HRSs are collaborative filtering, content-based, and knowledge-based methods [<xref ref-type="bibr" rid="ref27">27</xref>]. The collaborative filtering method recommends to the active user the items that other users with similar preferences liked in the past [<xref ref-type="bibr" rid="ref30">30</xref>]. One major drawback of collaborative filtering is the cold-start problem, referring to the problem that a new user who has not rated any items cannot receive recommendations (called new user problem) or a new item with too few ratings cannot be recommended (called new item problem). Compared with collaborative filtering, the content-based method solves the new item problem by recommending items with content-similar features as the user liked in the past. The similarity of items is calculated based on the features associated with the compared items [<xref ref-type="bibr" rid="ref31">31</xref>]. The knowledge-based method can be viewed as an extension of the content-based method, by considering how items meet user preferences or needs based on domain knowledge, instead of user ratings [<xref ref-type="bibr" rid="ref32">32</xref>]. Ontologies are often used for knowledge representation in the knowledge-based method [<xref ref-type="bibr" rid="ref33">33</xref>].</p>
        <p>Compared with collaborative filtering and the traditional content-based method, the knowledge-based method is considered more appropriate in the context of e-learning. In e-learning environments, different learners have different characteristics such as background knowledge, learning history, and competence level; therefore, even if two learners have similar ratings, they will require different recommendations if their characteristics are not the same [<xref ref-type="bibr" rid="ref34">34</xref>]. Conventional RAs such as collaborative filtering and content-based methods recommend items to users based solely on ratings, while the knowledge-based method can personalize user profiles to match the user characteristics through knowledge models such as ontologies [<xref ref-type="bibr" rid="ref35">35</xref>]. The aggregation of domain knowledge about the learner and learning resources has been proven to improve the quality of recommendations, meanwhile alleviating other conventional drawbacks such as cold-start and rating sparsity problems [<xref ref-type="bibr" rid="ref36">36</xref>]. Since patient self-learning based on electronic materials can be considered as a kind of e-learning, a knowledge-based HRS may be a better choice to incorporate additional information about patients for recommendation.</p>
        <p>Several studies have explored the feasibility of an HRS for recommending patient educational materials. Kandula et al [<xref ref-type="bibr" rid="ref20">20</xref>] used the IR approach to recommend relevant educational materials to diabetic patients. They applied the topic modeling method (latent Dirichlet allocation) to identify and match topics between educational materials and patients’ electronic medical records. Zeng et al [<xref ref-type="bibr" rid="ref37">37</xref>] also adopted the IR approach to recommend educational materials for diabetic patients. Instead of inferring patients’ needs from electronic medical record notes, they constructed patients’ questions on the forum as a query and then compared two algorithms (latent Dirichlet allocation and semantic group). Sanchez et al [<xref ref-type="bibr" rid="ref25">25</xref>] built a content-based recommender system that links patients to reputable health educational websites from MedlinePlus for a given health video from YouTube. They used the BioPortal application programming interface (API) to extract Systematized Nomenclature of Medicine–Clinical Terms (SNOMED-CT) terms from videos viewed by patients, and then used the MedlinePlus API to provide relevant MedlinePlus recommendations based on these terms. In their subsequent work [<xref ref-type="bibr" rid="ref38">38</xref>], they introduced natural language processing (NLP) techniques to extract SNOMED-CT terms from video content, and then added the Bio-ontology API to improve the results for obtaining synonymous MedlinePlus terms. Wang et al [<xref ref-type="bibr" rid="ref21">21</xref>] implemented a cloud-based mobile health information recommendation system that included a collaborative recommender and a physiological indicator-based recommender. These studies proved that HRSs have the potential to provide personalized education for patients using different information technologies. However, to the best of our knowledge, no studies to date have formally concentrated on a knowledge-based HRS for chronic disease patient education. Moreover, most of the materials are in English; no studies have provided the feasibility evidence of recommending materials in Chinese.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>Here we propose a knowledge-based HRS that recommends relevant educational materials to chronic disease patients according to their health data. The materials are limited to Chinese documents, and several NLP techniques will be used to preprocess the text-based materials. Further, this study explores the effect of the system through a pilot evaluation based on a manually annotated test collection.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design</title>
        <p>In this study, we had a corpus of patient educational materials retrieved from multiple sources and a data set of patients collected from a telehealth system. The task of this study was to design and implement an automated recommender system that can discover patients’ potential needs from their health data, and then recommend the most relevant educational materials to them. In addition, we needed to design an assessment method to evaluate system performance.</p>
        <p>The study was designed based on these tasks. <xref rid="figure1" ref-type="fig">Figure 1</xref> illustrates the overall study design. The complete recommendation process is presented in the dotted box. The core of the recommendation process is a custom ontology called Chronic Disease Patient Education Ontology (CDPEO), which describes patient characteristics for recommendation generation. Patient data and educational materials will be converted to vectors through CDPEO. Patient vectors and text vectors will have the same length, and the final recommendation results will be generated based on the similarity between these vectors. Patient data will be converted through a rule-based approach (blue arrows in <xref rid="figure1" ref-type="fig">Figure 1</xref>), while educational materials will be converted through an NLP-based approach (red arrows in <xref rid="figure1" ref-type="fig">Figure 1</xref>). System evaluation will be conducted based on a test collection of educational materials manually assembled by domain experts (black arrows in <xref rid="figure1" ref-type="fig">Figure 1</xref>).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Overall study design.</p>
          </caption>
          <graphic xlink:href="medinform_v8i4e17642_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Data Collection</title>
        <p>Patient educational materials used in this study came from multiple sources including websites, guidelines, and books, which have been reviewed and approved by several physicians (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for further information). We retrieved 88,746 documents in Chinese from these sources. Among these documents, 511 were manually extracted in the form of plain text from the guidelines or books, while the others were crawled from the websites and transformed into plain text using a Python software library called Beautiful Soup. Patient data used in this study came from a telehealth system, which is a pathway-driven mobile health (mHealth) system for chronic disease management. The system aims to provide comprehensive self-management support for patients and executable intervention plans for care providers [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>]. Currently, more than 5000 patients are using this system in Ningxia and Zhejiang provinces. We randomly selected 50 patients and collected their data to develop and test our recommender system. Data included demographics, laboratory test results, disease histories, self-monitoring records, and questionnaire results.</p>
      </sec>
      <sec>
        <title>Informed Consent and Ethical Consideration</title>
        <p>Patients registered in the telehealth system have signed inform consent forms for accessing and using their privacy data. The domain experts signed informed consent forms as well. All procedures were performed in accordance with the ethical guidelines for biomedical research involving human subjects at Ningxia Medical University.</p>
      </sec>
      <sec>
        <title>System Development Steps</title>
        <sec>
          <title>Overview</title>
          <p>The development process of the system can be divided into 3 stages. In stage 1, we constructed an ontology (CDPEO) for patient education mainly based on the collected data and materials. In stage 2, we designed and implemented an algorithm to generate the recommendations based on the ontology. In stage 3, we integrated the ontology and the algorithm into our mHealth system for practical use.</p>
        </sec>
        <sec>
          <title>Stage 1: Ontology Construction</title>
          <p>The construction of CDPEO followed a widely used ontology engineering methodology [<xref ref-type="bibr" rid="ref41">41</xref>], as shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>. First, we defined the domain and scope of CDPEO by sketching a list of questions the ontology should be able to answer. This method is called competency questions [<xref ref-type="bibr" rid="ref42">42</xref>]. Through this step, we confirmed that CDPEO will be used as a reference model for the representation of patient data and educational materials, and the intended output of CDPEO is a comprehensive label set for patient education. Second, we searched for reusable existing ontologies on BioPortal (a Web repository of biomedical ontologies) using keywords “hypertension,” “diabetes,” “chronic disease,” and “patient education.” A total of 9 ontologies were screened. However, due to the specific domain of our ontology, classes and properties defined in the existing ontologies could hardly be refined for our particular task. Therefore, we created CDPEO from scratch. Third, we collected all terminologies that might be used in the ontology. These terms were mainly collected from educational materials and patient data records. We selected terms able to describe patient characteristics or material topics, as well as concepts that might be involved in the recommendation process. All terms were originally in Chinese, translated into English for ontology construction. After applying this step, we obtained a relatively comprehensive term list with 54 terms. The term list was reviewed by the physicians as well. The detailed outputs of these 3 steps can be found in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
          <p>Fourth, based on the term list, we defined the classes and the class hierarchy of CDPEO through a top-down approach, which started with defining the most general concepts in the domain and subsequently specializing the concepts. CDPEO was built in two main levels of abstraction. Level 1 included 5 terms (demographic, disease, physiological index, lifestyle, and medication) that described characteristics contained in patient data. Level 2 included the detailed elements for each of the level 1 classes. Fifth, we defined the properties of classes based on the remaining terms to describe the internal structure of concepts. The properties consisted of two types: object properties and data properties. Object properties are relations between two individuals (ie, instances of classes), while data properties describe relations between an individual and a data value.</p>
          <p>Sixth, we defined property restrictions to complete the precise semantics of the classes. These restrictions were represented as a set of axioms including property and individual axioms. Property axioms described the facets of properties such as value type, number of values, and domain and scope of properties. Individual axioms described anonymous classes of individuals based on the relations that members of the class participate in. Seventh, we created individual instances of classes in the hierarchy. CDPEO was instantiated by the patient data. We defined a class called patient profile in the top level to be the core component of the instances. The characteristic instances were created and bound to the patient profile instance. Finally, we used the Semantic Web Rule Language (SWRL) [<xref ref-type="bibr" rid="ref43">43</xref>] to encode rules for complex inferences, for example, generating a new property of an instance. SWRL is based on rule markup language and compatible with the W3C Web Ontology Language (OWL) [<xref ref-type="bibr" rid="ref43">43</xref>]. In CDPEO, the SWRL rules were defined to evaluate the patient data and generate a fixed-length vector (33-dimensional) for recommendation generation.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Chronic Disease Patient Education Ontology construction steps.</p>
            </caption>
            <graphic xlink:href="medinform_v8i4e17642_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Stage 2: Recommendation Generation</title>
          <p>Based on the constructed ontology, we designed and implemented an algorithm to automatically generate recommendations of educational materials given patient data. The core idea of the algorithm was mapping patient data and educational materials to an identical vector space. The vector space came from the ontology, containing 33 terms that can describe patient data characteristics and document topics. The complete recommendation generation steps are shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>.</p>
          <p>For patient data, we used SWRL rules to infer the item values of the vector. The values were in the range of 0 to 3, which indicated the severity of the corresponding term. For example, in the vector space existed a term called blood pressure (BP), whose value was inferred based on the latest self-monitoring record of the patient. If the BP record was below 140/90 mm Hg, then the item value would be 0, otherwise the value would be 1, 2, or 3 based on the severity of the BP record (3 means the worst). All reasoning procedures were completed by the SWRL rules, and the results were saved as data properties of the corresponding patient profile instance.</p>
          <p>For educational materials, we applied an NLP-based approach to map documents to the vector space. First, we summarized the topic of each document by keywords. In this study, we used 2 famous statistical algorithms, term frequency–inverse document frequency (TF-IDF) [<xref ref-type="bibr" rid="ref44">44</xref>] and TextRank [<xref ref-type="bibr" rid="ref45">45</xref>], to extract keywords from educational materials. In TF-IDF, the IDF scores were calculated from the educational material corpus; in TextRank, undirected graphs for a co-occurrence window of 2 were used. Five keywords were extracted for each document. Furthermore, three strategies were introduced to improve extraction performance specifically for Chinese educational materials: weight assignment, compound word identification, and synonym elimination. <xref ref-type="table" rid="table1">Table 1</xref> summarizes these strategies, with a description of each strategy and its effects. A simple example of each strategy for intuitive interpretation can be found in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p>
          <p>In weight assignment, we set an additional weight value for some words based on the observation of the corpus. We observed that for patient educational materials in Chinese, title words and nouns were more likely to be the keywords while verbs were less likely to be the keywords. When performing keyword extraction, a weight greater than 1 could improve the likelihood of being the keyword while a weight less than 1 could reduce the likelihood. Consequently, weights of 3, 1.2, and 0.8 were assigned to title words, nouns, and verbs, respectively, by the investigators based on multiple experiments.</p>
          <p>In compound word identification, we aimed to identify compound words in patient educational materials. For Chinese documents, sentences need to be segmented into pieces of words, since all words are organized together without blanks in Chinese sentences. We observed that for patient educational materials in Chinese, a compound word was often segmented into separate atom words by the word segmentation algorithm. However, a compound word usually contains more information than a single atom word, and thus is more appropriate for being the keyword. To solve this problem, we designed several filter conditions to identify all compound words in educational materials before word segmentation, and then generated a user-defined dictionary of compound words to customize word segmentation. The filter conditions included co-occurrence frequency, part-of-speech tag for each atom word, and arrangement of atom words.</p>
          <p>In synonym elimination, we aimed to eliminate synonyms in the extracted keywords. Synonyms here refer to words composed with similar Chinese characters. We noticed that after introducing compound word identification, synonyms appeared more frequently in keyword extraction. To eliminate these synonyms, we converted each keyword candidate into a one-hot vector based on its character composition. The cosine similarity between each keyword was then calculated to determine if these keywords belong to synonyms. For the identified synonym pair, the longer one was retained while the shorter one was eliminated, since in Chinese longer synonyms usually contain the information in shorter synonyms.</p>
          <p>Second, the extracted keywords were mapped to the ontology vector space to generate the text vector based on cosine similarity between keywords and vector items. Similarity was calculated based on a pretrained word embedding of each keyword and vector item. In this study, we used the classic Word2Vec model to obtain statistic embedding vectors for each word [<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref47">47</xref>]. The model architecture used was the continuous bag-of-words architecture with a window size of 5, and the training algorithm was the negative sampling method. The training corpus was the collected 88,746 documents concerned with patient education. The item value of the text vector was calculated by the sum of a subset of similarity values between the corresponding item and all keywords. <xref rid="figure4" ref-type="fig">Figure 4</xref> shows the concrete calculation process, in which <italic>T<sub>j</sub></italic> corresponds to the <italic>j</italic>-th item of the text vector, <italic>n</italic> corresponds to the dimension of the pretrained word embeddings (in this study, <italic>n</italic>=200), threshold corresponds to a value between 0 and 1 (in this study, threshold=0.5).</p>
          <p>Given the patient vectors and text vectors, we calculated the inner product of each vector pair to indicate the correlation between patient data and educational materials. The inner product can be interpreted as a nonnormalized cosine similarity that considers the similarity of vectors in both direction and magnitude, as shown in <xref rid="figure5" ref-type="fig">Figure 5</xref>, where <italic>n</italic> corresponds to the dimension of the vector (in this study, <italic>n</italic>=33). Larger inner products indicate stronger correlation. Recommendations for a specific patient were generated based on the inner products between the corresponding patient vector and text vectors.</p>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Recommendation generation steps.</p>
            </caption>
            <graphic xlink:href="medinform_v8i4e17642_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Summary of the three strategies for improving keyword extraction performance.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="150"/>
              <col width="410"/>
              <col width="440"/>
              <thead>
                <tr valign="top">
                  <td>Strategy</td>
                  <td>Description</td>
                  <td>Effect</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Weight assignment</td>
                  <td>Assign weight of 3, 1.2, and 0.8 to title words, nouns, and verbs, respectively, when performing keyword extraction.</td>
                  <td>Nouns and title words will be more likely to be keywords, and verbs are less likely to be keywords.</td>
                </tr>
                <tr valign="top">
                  <td>Compound word identification</td>
                  <td> Use several filter conditions to generate user-defined dictionary of compound words in educational materials for word segmentation.</td>
                  <td> Compound words that meet filter conditions will be identified and are more likely to be the keywords than atom words.</td>
                </tr>
                <tr valign="top">
                  <td> Synonym elimination</td>
                  <td> Remove shorter keywords with similar Chinese characters based on cosine similarity between their character compositions.</td>
                  <td> Two or more keyword candidates with similar character composition will be merged into one keyword to avoid redundancy.</td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Concrete calculation process of the text vector.</p>
            </caption>
            <graphic xlink:href="medinform_v8i4e17642_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>Inner product of the patient vector and text vector.</p>
            </caption>
            <graphic xlink:href="medinform_v8i4e17642_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Stage 3: mHealth Implementation</title>
          <p>In this stage, we incorporated the recommender system (including the ontology and the algorithm) into our mHealth system for practical use. The entire recommender system was implemented as a Web service connected with the mobile app. For each patient, the service will calculate the specific patient vector and text vectors of documents that have not been provided to the patient, and then calculate the inner products between the patient and text vectors. For the recommendation, to reduce computation, we adopted a thresholding method: if the inner product is greater than a certain threshold, then the corresponding document will be considered to be relevant to the patient. The relevant documents will be added to a recommendation queue, pushed to the patient’s smartphone regularly. In addition, one other thing to note is that documents prohibited for reproduction will only be used for training and not be provided to patients.</p>
        </sec>
      </sec>
      <sec>
        <title>Development Tools</title>
        <p>Development and evaluation of the system were performed on an iMac (21.5-inch) with an Intel Core i7-5775R CPU 3.3 GHz, with 16 GB main memory running on macOS Mojave 10.14.6. We used the Protégé 5.5.0 open source ontology editor to develop the ontology in OWL2 standard format. The Pellet reasoner was used to enable SWRL reasoning under Protégé. The algorithm for recommendation generation was implemented using Python 3.6 (for source code see Wang and Huang [<xref ref-type="bibr" rid="ref48">48</xref>]). Several Python libraries have been imported to process the materials: for material retrieval, the Beautiful Soup library (version 4.4.0) was adopted to pull data out of HTML files and transform it into plain text; for keyword extraction, the Jieba library (version 0.39) was adopted for Chinese text segmentation; and for pretrained word embeddings, the Gensim library (version 3.8.1) [<xref ref-type="bibr" rid="ref49">49</xref>] was adopted to train the Word2Vec model. The Web service was developed under the Flask framework (a lightweight Web app framework for Python), in which the OWLready2 library (version 0.23) [<xref ref-type="bibr" rid="ref50">50</xref>] was used to manipulate the OWL2 ontology. System evaluation was conducted using Python 3.6.</p>
      </sec>
      <sec>
        <title>System Evaluation</title>
        <sec>
          <title>Test Collection Assembly</title>
          <p>To evaluate system performance, we invited 2 domain experts to assist in assembling a test collection of educational materials. These domain experts are case managers from the General Hospital of Ningxia Medical University. Their daily work is conducting follow-ups on chronic disease patients and providing health education for these patients. Considering the time cost of manual annotation, based on a study in this field [<xref ref-type="bibr" rid="ref37">37</xref>], 100 educational documents were randomly selected from the corpus to compose the test collection. The system performance evaluation was divided into two parts: evaluation of keyword extraction performance and evaluation of recommendation performance.</p>
        </sec>
        <sec>
          <title>Evaluation of Keyword Extraction Performance</title>
          <p>We asked one expert to extract 5 keywords from each document in the test collection (the other expert reviewed the results). The keywords must have explicitly appeared in the text. We then compared the automatically extracted keywords by the algorithms with the manual extraction results. The evaluation metric was the precision of automatic extraction for the entire test collection, inspired by the evaluation method of TextRank [<xref ref-type="bibr" rid="ref45">45</xref>], as shown in <xref rid="figure6" ref-type="fig">Figure 6</xref>. In this study, since the extracted word counts of manual annotation and algorithms are identical, precision equals recall—the fraction of correctly extracted keywords by algorithms out of the total correct keywords (N=500).</p>
          <fig id="figure6" position="float">
            <label>Figure 6</label>
            <caption>
              <p>Evaluation metrics of keyword extraction performance.</p>
            </caption>
            <graphic xlink:href="medinform_v8i4e17642_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Evaluation of Recommendation Performance</title>
          <p>We asked another expert to assign a recommendation score to each document in the test collection for each patient, inspired by Zeng et al [<xref ref-type="bibr" rid="ref37">37</xref>]. The other expert reviewed the results. For the pairing of patient data <italic>p</italic> and educational material document <italic>d</italic>, the expert assigned a score in the range of 0 to 2 to indicate if <italic>d</italic> was appropriate to recommend to <italic>p</italic>, where 0 indicated no need, 1 partial need, and 2 most need. According to the inner products between the patient vector and text vectors, a ranked sequence of the test collection was returned by the system for each patient. System performance was evaluated based on the precision of top <italic>k</italic> retrieved documents, as shown in <xref rid="figure7" ref-type="fig">Figure 7</xref>, where a partial need document was counted as 0.5. Since different patients have different precisions at <italic>k</italic>, we used the macro precision and the overall mean average precision (MAP) to evaluate the system performance, as shown in <xref rid="figure7" ref-type="fig">Figure 7</xref>, where <italic>m</italic> corresponds to the total number of patients (<italic>m</italic>=50), <italic>n</italic> corresponds to the total number of retrieved documents (<italic>n</italic>=100), (P @ <italic>k</italic>)<italic><sub>i</sub></italic> corresponds to the precision at <italic>k</italic> for patient <italic>i</italic>, rel<italic><sub>i</sub></italic> (<italic>k</italic>) is an indicator function equaling 1 if the item at rank <italic>k</italic> is a relevant document, zero otherwise (for patient <italic>i</italic>).</p>
          <fig id="figure7" position="float">
            <label>Figure 7</label>
            <caption>
              <p>Evaluation metrics of recommendation performance.</p>
            </caption>
            <graphic xlink:href="medinform_v8i4e17642_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overall Statistics</title>
        <sec>
          <title>Patient Statistics</title>
          <p><xref ref-type="table" rid="table2">Table 2</xref> shows a summary of the collected patient data. The patients were 50 adults with an average age of 57 years. Their characteristics were divided into 5 categories: demographics, disease history, laboratory tests, self-monitoring, and questionnaires. Among these categories, demographic data, disease history data, and laboratory test data came from the patients’ corresponding electronic health records, while questionnaire and self-monitoring data came from the patients’ daily use records of the system. For self-monitoring data, we extracted the most recent week’s records for each patient (by the end of July 2019). For questionnaire data, the 9-item Patient Health Questionnaire [<xref ref-type="bibr" rid="ref51">51</xref>] and International Physical Activity Questionnaire [<xref ref-type="bibr" rid="ref52">52</xref>] were used to assess the depression level and physical activity level of patients, respectively. We extracted the latest record of each patient’s questionnaire data. In recommendation generation, all the patient data were mapped to the ontology vector space with a severity level ranging from 0 to 3.</p>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Patient characteristics from the collected data (n=50).</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="30"/>
              <col width="720"/>
              <col width="220"/>
              <thead>
                <tr valign="top">
                  <td colspan="3">Patient characteristics</td>
                  <td>Value</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Demographic</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <bold>Sex, n (%)</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Female</td>
                  <td>23 (46)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Male</td>
                  <td>27 (54)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">Age in years, mean (SD)</td>
                  <td>57 (0.57)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <bold>Body mass index (kg/m  <sup>2</sup>), n (%)</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Normal<sup>a</sup></td>
                  <td>16 (32)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Overweight</td>
                  <td>34 (68)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <bold>Pregnancy, n (%)</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Pregnant</td>
                  <td>0 (0)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Nonpregnant</td>
                  <td>50 (100)</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Disease history, n (%)</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">Hypertension</td>
                  <td>50 (100)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">Diabetes</td>
                  <td>6 (12)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">Stroke</td>
                  <td>4 (8)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">Hyperlipidemia</td>
                  <td>12 (24)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2"> Coronary artery disease</td>
                  <td>3 (6)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">Chronic obstructive pulmonary disease</td>
                  <td>2 (4)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">Other diseases</td>
                  <td>17 (34)</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Laboratory test, n (%)</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2"> Blood glucose (normal)<sup>b</sup></td>
                  <td>36 (72)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2"> Total cholesterol (normal)<sup>c</sup></td>
                  <td>36 (72)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2"> Triglyceride (normal)<sup>d</sup></td>
                  <td>29 (58)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2"> High density lipoprotein (normal)<sup>e</sup></td>
                  <td>43 (86)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">Low density lipoprotein (normal)<sup>f</sup></td>
                  <td>40 (80)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2"> Uric acid (normal)<sup>g</sup></td>
                  <td>39 (78)</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Self-monitoring data, n (%)</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <bold>Blood pressure</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Normal<sup>h</sup></td>
                  <td>23 (46)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Abnormal</td>
                  <td>27 (54)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <bold>Smoking and drinking</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Smoking</td>
                  <td>7 (14)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Drinking</td>
                  <td>9 (18)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <bold>Diet</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Good</td>
                  <td>19 (38)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Medium</td>
                  <td>27 (54)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Poor</td>
                  <td>4 (8)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <bold>Medication</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Antihypertensive drugs</td>
                  <td>50 (100)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Hypoglycemic drugs</td>
                  <td>3 (6)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Hypolipidemic drugs</td>
                  <td>12 (24)</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Questionnaire, n (%)</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <bold>9-item Patient Health Questionnaire</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Minimal depression</td>
                  <td>33 (66)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Mild depression</td>
                  <td>12 (24)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Moderate depression</td>
                  <td>3 (6)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Moderately severe depression</td>
                  <td>2 (4)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Severe depression</td>
                  <td>0 (0)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <bold>International Physical Activity Questionnaire</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>High physical activity level</td>
                  <td>18 (36)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Moderate physical activity level</td>
                  <td>23 (46)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Low physical activity level</td>
                  <td>9 (18)</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table2fn1">
                <p><sup>a</sup>Reference range of body mass index: 18.5-23.9 kg/m<sup>2</sup> for Chinese patients.</p>
              </fn>
              <fn id="table2fn2">
                <p><sup>b</sup>Reference range of blood glucose: 3.9-6.1 mmol/L.</p>
              </fn>
              <fn id="table2fn3">
                <p><sup>c</sup>Reference range of total cholesterol: 2.9-5.2 mmol/L.</p>
              </fn>
              <fn id="table2fn4">
                <p><sup>d</sup>Reference range of triglyceride: 0.56-1.70 mmol/L.</p>
              </fn>
              <fn id="table2fn5">
                <p><sup>e</sup>Reference range of high density lipoprotein: 1.20-1.68 mmol/L.</p>
              </fn>
              <fn id="table2fn6">
                <p><sup>f</sup>Reference range of low density lipoprotein: 2.07-3.12 mmol/L.</p>
              </fn>
              <fn id="table2fn7">
                <p><sup>g</sup>Reference range of uric acid: 149-416 μmol/L (for men under 60), 89-357 μmol/L (for women under 60), 250-476 μmol/L (for men over 60), 190-434 μmol/L (for women over 60).</p>
              </fn>
              <fn id="table2fn8">
                <p><sup>h</sup>Reference range of blood pressure: 90-119 mm Hg for systolic BP, 60-79 mm Hg for diastolic BP.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Material Statistics</title>
          <p><xref ref-type="table" rid="table3">Table 3</xref> shows an overview of the entire corpus (88,746 documents) and the test collection (100 documents). The mean document length (word count) was 490 (SD 387) and 719 (SD 462) for the corpus and the test collection, respectively. The unique word count in the entire corpus was 270,591 with 10,707 in the test collection. <xref rid="figure8" ref-type="fig">Figure 8</xref> shows the topic distribution of the test collection, in which we counted the number of documents related to each term in the ontology vector space based on the mapping method mentioned in stage 2. Among the 33 terms, hypertension, diabetes, diet, blood glucose, and antihypertensive drug were the most common topics discussed by educational materials in the test collection.</p>
          <table-wrap position="float" id="table3">
            <label>Table 3</label>
            <caption>
              <p>Overview of the entire corpus and the test collection.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="220"/>
              <col width="150"/>
              <col width="220"/>
              <col width="250"/>
              <col width="160"/>
              <thead>
                <tr valign="top">
                  <td>Corpus</td>
                  <td>Number</td>
                  <td>Total word count</td>
                  <td>Word count, mean (SD)</td>
                  <td>Unique word count</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Entire corpus</td>
                  <td>88,746</td>
                  <td>40,797,062</td>
                  <td>490 (387)</td>
                  <td>270,591</td>
                </tr>
                <tr valign="top">
                  <td>Test collection</td>
                  <td>100</td>
                  <td>71,905</td>
                  <td>719 (462)</td>
                  <td>10,707</td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
          <fig id="figure8" position="float">
            <label>Figure 8</label>
            <caption>
              <p>Topic distribution of the test collection.</p>
            </caption>
            <graphic xlink:href="medinform_v8i4e17642_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
      <sec>
        <title>System Development Results</title>
        <sec>
          <title>Stage 1: Ontology Construction</title>
          <p>The current version of CDPEO contained 40 classes, 31 object properties, 67 data properties, and 32 individuals (see <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref> for the detailed ontology nonzero metrics). As mentioned before, CDPEO mainly consisted of two levels: 5 terms that described patient characteristics (level 1) and the detailed elements for each term (level 2). The patient profile class was used to generate the instance of patient data, using object properties to connect to specific characteristic instances. These properties were also described as a set of universal restrictions to specify the complete semantics. All specific characteristic instances contained one or more data properties to describe the concrete value of that characteristic. For example, for blood pressure, the data property connected to two double-type values representing systolic and diastolic BP; while for smoking, the data property connected to an integer type value that describes the daily cigarette count of the patient. <xref rid="figure9" ref-type="fig">Figure 9</xref> shows the class diagram of CDPEO’s main core. We have not added all the classes and properties in order to keep the figure simple. CDPEO is publicly available and can be freely downloaded from BioPortal [<xref ref-type="bibr" rid="ref53">53</xref>].</p>
          <p>The 33-dimensional ontology vector space was generated from the level 2 classes, in which each dimension corresponds to a term describing patient characteristics and document topics (originally in Chinese), as shown in <xref rid="figure8" ref-type="fig">Figure 8</xref>. A total of 80 SWRL rules were defined to implement the semantic logic of mapping patient original data to the ontology vector space. The complete SWRL list can be found in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref> as well.</p>
          <fig id="figure9" position="float">
            <label>Figure 9</label>
            <caption>
              <p>Class diagram of the Chronic Disease Patient Education Ontology’s main core.</p>
            </caption>
            <graphic xlink:href="medinform_v8i4e17642_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Stage 2: Recommendation Generation</title>
          <p>The patient vectors were generated by the SWRL rules. In CDPEO, the 33 vector items corresponded to 33 data properties, each with a prefix of vectorItem. The general reasoning procedures of the SWRL rules are as follows: first, the rules took the patient profile instance and the connected characteristic instances (including the specific data values) as inputs and calculated the values of the vector items by using the built-in attributes to perform the logic judgment; second, the rules connected the item values to the patient profile instance via the data properties prefixed with vectorItem.</p>
          <p>The text vectors were generated based on the keywords of each document and the Word2Vec embeddings. The keyword extraction performance was evaluated in the next section. The pretrained embedding for each word in the corpus was a 200-dimensional vector. To intuitively evaluate the performance of the Word2Vec model, we extracted the embeddings of the 33 terms in the ontology vector space, and then visualized them in a 2-dimensional space using principal component analysis [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]. As shown in <xref rid="figure10" ref-type="fig">Figure 10</xref>, terms with similar meanings tended to have embeddings with similar directions (eg, male and female), which proves that the pretrained Word2Vec embeddings were able to capture the semantic meanings behind the words. Therefore, we used the Word2Vec embeddings to map the extracted keywords to the ontology vector space.</p>
          <p>To better understand the entire recommendation generation process, we selected one patient from the 50 and one document from the test collection to perform a simple case study. <xref rid="figure11" ref-type="fig">Figure 11</xref> shows the complete scenario. The detailed description of this case study can be found in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>.</p>
          <fig id="figure10" position="float">
            <label>Figure 10</label>
            <caption>
              <p>Word2Vec embedding visualization of the 33 ontology vector items.</p>
            </caption>
            <graphic xlink:href="medinform_v8i4e17642_fig10.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure11" position="float">
            <label>Figure 11</label>
            <caption>
              <p>Complete scenario for the recommendation generation process.</p>
            </caption>
            <graphic xlink:href="medinform_v8i4e17642_fig11.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Stage 3: mHealth Implementation</title>
          <p>The recommender system was implemented as a part of our mHealth system [<xref ref-type="bibr" rid="ref39">39</xref>]. <xref rid="figure12" ref-type="fig">Figure 12</xref> shows the structure of the system. We designed the recommender system as a separate service, interacting with the app via RESTful APIs [<xref ref-type="bibr" rid="ref56">56</xref>]. As mentioned before, the recommendations were first generated based on a certain threshold, and then added to a recommendation queue waiting to be pushed. In practice, the threshold is configurable, which means care providers can adjust the threshold value based on the actual effect. Considering the sparsity of the vectors, the initial threshold value was relatively small (<italic>v</italic>=2). The system will push the relevant documents to patients’ smartphones every day according to the recommendation queue, and update the patient and text vectors to add new relevant documents to the queue. Recommendations will be displayed in the Health Education functional module of the app.</p>
          <fig id="figure12" position="float">
            <label>Figure 12</label>
            <caption>
              <p>Structure of the system.</p>
            </caption>
            <graphic xlink:href="medinform_v8i4e17642_fig12.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
      <sec>
        <title>System Evaluation</title>
        <sec>
          <title>Evaluation of Keyword Extraction Performance</title>
          <p>We extracted 5 keywords for each document in the test collection automatically using 4 different algorithms. The 4 different algorithms were the original TF-IDF and TextRank methods, as well as the modified versions of them with our proposed 3 strategies. The evaluation results are shown in <xref ref-type="table" rid="table4">Table 4</xref>. Among the 4 algorithms, the improved TextRank achieved the best overall precision of 53.2% (266/500), while the improved TF-IDF achieved the worst overall precision of 26.6% (133/500).</p>
          <table-wrap position="float" id="table4">
            <label>Table 4</label>
            <caption>
              <p>Results for automatic keyword extraction using different algorithms.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="320"/>
              <col width="100"/>
              <col width="160"/>
              <col width="120"/>
              <col width="120"/>
              <col width="0"/>
              <col width="180"/>
              <thead>
                <tr valign="top">
                  <td> Method</td>
                  <td colspan="2">Automatic extraction</td>
                  <td colspan="2">Correct keywords</td>
                  <td colspan="2">Precision (%)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Total</td>
                  <td>Mean</td>
                  <td>Total</td>
                  <td colspan="2">Mean</td>
                  <td>
                    <break/>
                  </td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Improved TextRank</td>
                  <td>500</td>
                  <td>5</td>
                  <td>266</td>
                  <td colspan="2">2.66</td>
                  <td>53.2</td>
                </tr>
                <tr valign="top">
                  <td>Original TextRank</td>
                  <td>500</td>
                  <td>5</td>
                  <td>151</td>
                  <td colspan="2">1.51</td>
                  <td>30.2</td>
                </tr>
                <tr valign="top">
                  <td>Improved TF-IDF<sup>a</sup></td>
                  <td>500</td>
                  <td>5</td>
                  <td>133</td>
                  <td colspan="2">1.33</td>
                  <td>26.6</td>
                </tr>
                <tr valign="top">
                  <td>Original TF-IDF</td>
                  <td>500</td>
                  <td>5</td>
                  <td>206</td>
                  <td colspan="2">2.06</td>
                  <td>41.2</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table4fn1">
                <p><sup>a</sup>TF-IDF: term frequency–inverse document frequency.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Evaluation of Recommendation Performance</title>
          <p>Based on patient data and extracted keywords for each document in the test collection, we calculated the inner products for each patient-document pair and generated the top <italic>k</italic> recommendations. System performance with different extracted keywords is presented in <xref ref-type="table" rid="table5">Table 5</xref> and <xref rid="figure13" ref-type="fig">Figure 13</xref>. The average number of manually annotated appropriate documents for each patient was 41 out of 100, which can be considered as the macro precision for a random recommendation (the dotted red line in <xref rid="figure13" ref-type="fig">Figure 13</xref>).</p>
          <p>Among the 5 methods, the improved TF-IDF achieved the highest macro precision (0.970) at the top 1 recommendation. From the curve, the TF-IDF methods (original and improved version) outperformed the TextRank methods, especially at top 1 to 10 recommendations. The manual annotated keywords had a medium performance at top 1 to 15 recommendations, compared with other methods. As the number of recommendations increases, the performances of each method tended to be closer. For the overall MAP score, manual annotation achieved the highest value (0.635), while the original TextRank achieved the lowest value (0.585). The other 3 methods obtained similar scores (mean 0.623).</p>
          <table-wrap position="float" id="table5">
            <label>Table 5</label>
            <caption>
              <p>Performance comparison among different keyword extraction algorithms for n=50 evaluations (patients).</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="170"/>
              <col width="70"/>
              <col width="70"/>
              <col width="80"/>
              <col width="90"/>
              <col width="70"/>
              <col width="70"/>
              <col width="80"/>
              <col width="80"/>
              <col width="70"/>
              <col width="70"/>
              <col width="80"/>
              <thead>
                <tr valign="top">
                  <td>Method</td>
                  <td>MAP<sup>a</sup></td>
                  <td colspan="10">Macro Precision</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>P@1</td>
                  <td>P@2</td>
                  <td>P@3</td>
                  <td>P@4</td>
                  <td>P@5</td>
                  <td>P@10</td>
                  <td>P@15</td>
                  <td>P@20</td>
                  <td>P@25</td>
                  <td>P@30</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Improved TextRank</td>
                  <td>0.622</td>
                  <td>0.810</td>
                  <td>0.730</td>
                  <td>0.713</td>
                  <td>0.705</td>
                  <td>0.710</td>
                  <td>0.717</td>
                  <td>0.701</td>
                  <td>0.688</td>
                  <td>0.673</td>
                  <td>0.645</td>
                </tr>
                <tr valign="top">
                  <td>Original TextRank</td>
                  <td>0.585</td>
                  <td>0.610</td>
                  <td>0.600</td>
                  <td>0.650</td>
                  <td>0.648</td>
                  <td>0.642</td>
                  <td>0.661</td>
                  <td>0.665</td>
                  <td>0.662</td>
                  <td>0.646</td>
                  <td>0.641</td>
                </tr>
                <tr valign="top">
                  <td>Improved TF-IDF<sup>b</sup></td>
                  <td>0.620</td>
                  <td>0.970</td>
                  <td>0.920</td>
                  <td>0.880</td>
                  <td>0.845</td>
                  <td>0.822</td>
                  <td>0.741</td>
                  <td>0.715</td>
                  <td>0.677</td>
                  <td>0.651</td>
                  <td>0.632</td>
                </tr>
                <tr valign="top">
                  <td>Original TF-IDF</td>
                  <td>0.628</td>
                  <td>0.930</td>
                  <td>0.875</td>
                  <td>0.867</td>
                  <td>0.853</td>
                  <td>0.836</td>
                  <td>0.772</td>
                  <td>0.723</td>
                  <td>0.680</td>
                  <td>0.660</td>
                  <td>0.634</td>
                </tr>
                <tr valign="top">
                  <td>Manual Annotation</td>
                  <td>0.635</td>
                  <td>0.650</td>
                  <td>0.720</td>
                  <td>0.740</td>
                  <td>0.753</td>
                  <td>0.740</td>
                  <td>0.726</td>
                  <td>0.707</td>
                  <td>0.697</td>
                  <td>0.681</td>
                  <td>0.660</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table5fn1">
                <p><sup>a</sup>MAP: mean average precision.</p>
              </fn>
              <fn id="table5fn2">
                <p><sup>b</sup>TF-IDF: term frequency–inverse document frequency.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <fig id="figure13" position="float">
            <label>Figure 13</label>
            <caption>
              <p>Macro precisions at rank 1 to 30 of different keyword extraction algorithms for n=50 evaluations (patients).</p>
            </caption>
            <graphic xlink:href="medinform_v8i4e17642_fig13.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In this study, we investigated the use of knowledge-based RAs with a combination of NLP techniques to recommend Chinese educational materials to chronic disease patients. The constructed ontology (CDPEO) can describe patient characteristics, linking them to the topics of educational materials. The recommender system was implemented as a Web service connected with patients’ smartphones. According to the evaluation results, our system achieved a macro precision up to 0.970 for the top 1 recommendation and an overall MAP score up to 0.628.</p>
        <p>Some interesting aspects can be found from the evaluation results. First, the improved TextRank has the potential to be the most suitable keyword extraction algorithm for our system, since it achieved the best performance in keyword extraction and obtained a relatively high score (0.622) for the overall MAP. Second, for the improved TF-IDF, there existed a performance gap between keyword extraction and recommendation. This algorithm achieved the worst performance in keyword extraction; however, it outperformed the other methods in the macro precision of the top 1 to 3 recommendations. This result may be explained by the fact that the improved TF-IDF produced output that tended toward compound words, according to the concrete extraction results. The manually extracted keywords didn’t involve many compound words, which resulted in the low precision of keyword extraction for the improved TF-IDF; however, compound words contained more information than atom words, which is advantageous for recommendation.</p>
        <p>Third, as mentioned in the results section, the TextRank methods didn’t perform as well as the TF-IDF methods in the macro precision of recommendation. This result could be attributed to the different principles behind the two types of methods. In TF-IDF, keywords were extracted based on term frequency and inverse document frequency [<xref ref-type="bibr" rid="ref44">44</xref>], which uses the information of the entire corpus. Further, our compound word identification strategy took the term frequency as an important filter condition, which resulted in the large amount of compound words in the keywords extracted by the improved TF-IDF method. On the other hand, the rationale of TextRank is extracting keywords based on a graph-based ranking model [<xref ref-type="bibr" rid="ref45">45</xref>], which only uses the information of one single document. The information gap between these methods may lead to the different recommendation performances. To summarize, from our results, the performance of keyword extraction didn’t exactly correspond to the recommendation performance. Our strategies for keyword extraction have different effects on different algorithms. The recommendation performance is closely related to the rationales behind the algorithms.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>To better delineate the contribution of this paper, we compared our study with prior work in two aspects. In terms of keyword extraction, several studies have explored the effect of traditional techniques combined with improvement strategies to extract keywords from Chinese documents. Li et al [<xref ref-type="bibr" rid="ref57">57</xref>] proposed a new keyword extraction method for news documents based on TF-IDF with multistrategies. They first performed word segmentation to obtain candidate keywords of uni-, bi- and trigrams, meanwhile recognizing unknown candidate keywords based on several measures; they then calculated the features of keyword candidates to get the final keywords according to their morphological characters and context information. Wang et al [<xref ref-type="bibr" rid="ref58">58</xref>] designed a hybrid keyword extraction method based on TF and semantic strategies. Similarly, they obtained candidate keywords based on word segmentation results and a new word-finding method, and then performed feature calculation for each candidate word and introduced several strategies to filter dependent words and remove synonyms. Zhao et al [<xref ref-type="bibr" rid="ref59">59</xref>] applied semantic similarity computation and the frequent pattern growth algorithm to mine candidate keyword sets, and then calculated the weight of each candidate word based on frequency, part of speech, and position information.</p>
        <p>Compared with these studies, our strategies for keyword extraction focused on patient educational materials, and extracted keywords were used as inputs for recommendation generation. The different application scenarios and objectives led to the difference in implementation details of our strategies. In weight assignment, we considered the part of speech (nouns and verbs) and the position of words (in titles) together while prior studies usually treated these items separately. In compound word identification, we recognized the compound words before the formal word segmentation and generated a user-defined dictionary to customize the word segmentation, while prior studies chose to identify such unknown words after word segmentation. In synonym elimination, we identified the synonyms by calculating the cosine similarity between character compositions of keywords, which had not been proposed in prior studies. Furthermore, we applied our strategies to two different algorithms. From the evaluation results, these strategies had a better effect on the TextRank algorithm than the TF-IDF algorithm.</p>
        <p>In terms of the entire recommender system, several studies concerned with HRS for patient education have been described in the introduction section. Compared with these studies, our study was innovative in a few ways. First, our system was designed as a knowledge-based HRS, using ontologies to model patient characteristics, while prior studies generally adopted an IR approach [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref37">37</xref>] or traditional RAs [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. Second, to the best of our knowledge, this study is the first to explore the feasibility of recommending Chinese materials using information technologies in the field of patient education. Since preprocessing procedures for Chinese documents are quite different from English documents (eg, the word segmentation), our method can provide constructive guidance to future research.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>Our study has several strengths. First, the vectors used for recommendation generation is adaptable to specific requirements. With simple adjustment of ontology vector space by adding or deleting terms, patient and text vectors will be automatically generated. Second, recommendations generated through our method are more interpretable than traditional methods (such as content-based methods and collaborative filtering). In traditional methods, results are generated according to users’ previous ratings, which lacks a strong explanation for the current recommendations. However, in our study, the results can be explained based on the co-occurrent nonzero items in these two vectors. A larger product of the corresponding item indicates a higher relevance of the specific characteristic (topic) between the patient and the educational item. Third, the system was implemented as a Web service of our mHealth system. Patients are able to view daily updates about personalized health information on their smartphones, which provides possibility for large-scale practical application and evaluation in the future.</p>
        <p>A number of potential methodological weaknesses need to be acknowledged. First, the NLP techniques used in this study are mainly word-level techniques, which may not be able to capture the deep semantic meanings behind sentences or documents. The keyword extraction algorithms are word-level statistical methods and the Word2Vec model produces static word embeddings instead of contextual word embeddings. Moreover, the precision of keyword extraction remains to be improved. Second, the constructed ontology and SWRL rules remain to be further validated for their consistency, correctness, and completeness.</p>
        <p>In addition, validity of the test collection was limited as well. Potential selection bias may exist in terms of patients and educational materials. According to the statistics, the average age of the patients was 57 years, which means the effect of our recommender system for younger patients is unknown; the mean length of the selected materials was greater than the entire corpus, which means the effect of our method on shorter text needs further investigation. Moreover, the scale of the test collection was relatively small, and manual annotation was completed by two experts separately without strict validation. The precision of 1-patient recommendation may have a great impact on the macro precision and overall MAP score.</p>
      </sec>
      <sec>
        <title>Future Work</title>
        <p>In future work, we will test the effect of our method on a larger test collection. Comparison tests should be conducted to determine if our system can perform well at a larger scale. We also plan to evaluate the system for patients in a broader age distribution and involve patients in the assessment procedures. Currently, evaluation of relevance is done by case managers only, and their opinions may differ from the patients’ perceived usefulness. The opinions of patients can be used to strengthen the recommender system as well. Another direction for future work is to explore a new sentence-level or document-level approach to understand the deep semantic meanings of the materials. For example, the feasibility of applying a pretrained language model (such as bidirectional encoder representation from transformers [<xref ref-type="bibr" rid="ref60">60</xref>] and XLNet [<xref ref-type="bibr" rid="ref61">61</xref>]) combined with a downstream task (such as multilabel classification) would be investigated.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study has shown that a knowledge-based recommender system has the potential to accurately recommend health educational materials to chronic disease patients. Patient characteristics can be linked to document topics through the ontology. NLP techniques such as keyword extraction and pretrained word embeddings proved to be effective for processing educational materials. Furthermore, documents in Chinese have different preprocessing procedures from those in English. Our study indicates that traditional techniques combined with several strategies for specific language and domain can improve the final results to a certain extent. Further research might investigate the use of other state-of-the-art NLP techniques in HRS for better precision or explore the effect of such systems from the perspective of patients in a practical setting.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Detailed information about material sources.</p>
        <media xlink:href="medinform_v8i4e17642_app1.pdf" xlink:title="PDF File  (Adobe PDF File), 295 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Detailed outputs in the first three steps of the Chronic Disease Patient Education Ontology construction.</p>
        <media xlink:href="medinform_v8i4e17642_app2.pdf" xlink:title="PDF File  (Adobe PDF File), 137 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Examples of the three improvement strategies for keyword extraction.</p>
        <media xlink:href="medinform_v8i4e17642_app3.pdf" xlink:title="PDF File  (Adobe PDF File), 99 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Detailed metrics and Semantic Web Rule Language rule list of the Chronic Disease Patient Education Ontology.</p>
        <media xlink:href="medinform_v8i4e17642_app4.pdf" xlink:title="PDF File  (Adobe PDF File), 192 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Case study of the recommendation generation.</p>
        <media xlink:href="medinform_v8i4e17642_app5.pdf" xlink:title="PDF File  (Adobe PDF File), 337 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BP</term>
          <def>
            <p>blood pressure</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CDPEO</term>
          <def>
            <p>Chronic Disease Patient Education Ontology</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">HRS</term>
          <def>
            <p>health recommender system</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">IR</term>
          <def>
            <p>information retrieval</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">MAP</term>
          <def>
            <p>mean average precision</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">mHealth</term>
          <def>
            <p>mobile health</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">OWL</term>
          <def>
            <p>W3C Web Ontology Language</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">RA</term>
          <def>
            <p>recommendation algorithm</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">SNOMED-CT</term>
          <def>
            <p>Systematized Nomenclature of Medicine–Clinical Terms</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">SWRL</term>
          <def>
            <p>Semantic Web Rule Language</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">TF-IDF</term>
          <def>
            <p>term frequency–inverse document frequency</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was supported by the National Key Research and Development Program of China (No. 2018YFC0910503, No. 2016YFC0901703, and No. 2017YFC0114105), the Key Research and Development Program of Ningxia Hui Autonomous of China (No. 2018BFG02009), and the Open Fund of Engineering Research Center of Cognitive Healthcare of Zhejiang Province (Sir Run Run Shaw Hospital), China (No. 2018KFJJ02).</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>World Health Organization</collab>
          </person-group>
          <source>Global status report on noncommunicable diseases 2014</source>
          <access-date>2020-04-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://apps.who.int/iris/bitstream/10665/148114/1/9789241564854_eng.pdf?ua=1">http://apps.who.int/iris/bitstream/10665/148114/1/9789241564854_eng.pdf?ua=1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reynolds</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dennis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hasan</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Slewa</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Tian</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bobba</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zwar</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>A systematic review of chronic disease management interventions in primary care</article-title>
          <source>BMC Fam Pract</source>
          <year>2018</year>
          <month>01</month>
          <day>09</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>11</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcfampract.biomedcentral.com/articles/10.1186/s12875-017-0692-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12875-017-0692-3</pub-id>
          <pub-id pub-id-type="medline">29316889</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12875-017-0692-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC5759778</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Greene</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hibbard</surname>
              <given-names>JH</given-names>
            </name>
          </person-group>
          <article-title>Why does patient activation matter? An examination of the relationships between patient activation and health-related outcomes</article-title>
          <source>J Gen Intern Med</source>
          <year>2012</year>
          <month>05</month>
          <volume>27</volume>
          <issue>5</issue>
          <fpage>520</fpage>
          <lpage>526</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22127797"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11606-011-1931-2</pub-id>
          <pub-id pub-id-type="medline">22127797</pub-id>
          <pub-id pub-id-type="pmcid">PMC3326094</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berkman</surname>
              <given-names>ND</given-names>
            </name>
            <name name-style="western">
              <surname>Sheridan</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Donahue</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Halpern</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Crotty</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Low health literacy and health outcomes: an updated systematic review</article-title>
          <source>Ann Intern Med</source>
          <year>2011</year>
          <month>07</month>
          <day>19</day>
          <volume>155</volume>
          <issue>2</issue>
          <fpage>97</fpage>
          <lpage>107</lpage>
          <pub-id pub-id-type="doi">10.7326/0003-4819-155-2-201107190-00005</pub-id>
          <pub-id pub-id-type="medline">21768583</pub-id>
          <pub-id pub-id-type="pii">155/2/97</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xuan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>The effect of health literacy and self-management efficacy on the health-related quality of life of hypertensive patients in a western rural area of China: a cross-sectional study</article-title>
          <source>Int J Equity Health</source>
          <year>2017</year>
          <month>07</month>
          <day>01</day>
          <volume>16</volume>
          <issue>1</issue>
          <fpage>58</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://equityhealthj.biomedcentral.com/articles/10.1186/s12939-017-0551-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12939-017-0551-9</pub-id>
          <pub-id pub-id-type="medline">28666443</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12939-017-0551-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC5493849</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Geboers</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>de Winter</surname>
              <given-names>AF</given-names>
            </name>
            <name name-style="western">
              <surname>Spoorenberg</surname>
              <given-names>SLW</given-names>
            </name>
            <name name-style="western">
              <surname>Wynia</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Reijneveld</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>The association between health literacy and self-management abilities in adults aged 75 and older, and its moderators</article-title>
          <source>Qual Life Res</source>
          <year>2016</year>
          <month>11</month>
          <volume>25</volume>
          <issue>11</issue>
          <fpage>2869</fpage>
          <lpage>2877</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27101999"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11136-016-1298-2</pub-id>
          <pub-id pub-id-type="medline">27101999</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11136-016-1298-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC5065597</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Booth</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Fear</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gill</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Chronic disease patient education: lessons from meta-analyses</article-title>
          <source>Patient Educ Couns</source>
          <year>2001</year>
          <month>08</month>
          <volume>44</volume>
          <issue>2</issue>
          <fpage>107</fpage>
          <lpage>117</lpage>
          <pub-id pub-id-type="doi">10.1016/s0738-3991(00)00182-8</pub-id>
          <pub-id pub-id-type="medline">11479051</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(00)00182-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stenberg</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Haaland-Øverby</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fredriksen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Westermann</surname>
              <given-names>KF</given-names>
            </name>
            <name name-style="western">
              <surname>Kvisvik</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>A scoping review of the literature on benefits and challenges of participating in patient education programs aimed at promoting self-management for people living with chronic illness</article-title>
          <source>Patient Educ Couns</source>
          <year>2016</year>
          <month>11</month>
          <volume>99</volume>
          <issue>11</issue>
          <fpage>1759</fpage>
          <lpage>1771</lpage>
          <pub-id pub-id-type="doi">10.1016/j.pec.2016.07.027</pub-id>
          <pub-id pub-id-type="medline">27461944</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(16)30322-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Coppola</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sasso</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bagnasco</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Giustina</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gazzaruso</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>The role of patient education in the prevention and management of type 2 diabetes: an overview</article-title>
          <source>Endocrine</source>
          <year>2016</year>
          <month>07</month>
          <volume>53</volume>
          <issue>1</issue>
          <fpage>18</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="doi">10.1007/s12020-015-0775-7</pub-id>
          <pub-id pub-id-type="medline">26494579</pub-id>
          <pub-id pub-id-type="pii">10.1007/s12020-015-0775-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gee</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Greenwood</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Paterniti</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Ward</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>LMS</given-names>
            </name>
          </person-group>
          <article-title>The eHealth Enhanced Chronic Care Model: a theory derivation approach</article-title>
          <source>J Med Internet Res</source>
          <year>2015</year>
          <volume>17</volume>
          <issue>4</issue>
          <fpage>e86</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmir.org/2015/4/e86/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.4067</pub-id>
          <pub-id pub-id-type="medline">25842005</pub-id>
          <pub-id pub-id-type="pii">v17i4e86</pub-id>
          <pub-id pub-id-type="pmcid">PMC4398883</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rush</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Hatt</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Janke</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Burton</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrier</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tetrault</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The efficacy of telehealth delivered educational approaches for patients with chronic diseases: a systematic review</article-title>
          <source>Patient Educ Couns</source>
          <year>2018</year>
          <month>08</month>
          <volume>101</volume>
          <issue>8</issue>
          <fpage>1310</fpage>
          <lpage>1321</lpage>
          <pub-id pub-id-type="doi">10.1016/j.pec.2018.02.006</pub-id>
          <pub-id pub-id-type="medline">29486994</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(18)30053-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Win</surname>
              <given-names>KT</given-names>
            </name>
            <name name-style="western">
              <surname>Hassan</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Bonney</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Iverson</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Benefits of online health education: perception from consumers and health professionals</article-title>
          <source>J Med Syst</source>
          <year>2015</year>
          <month>03</month>
          <volume>39</volume>
          <issue>3</issue>
          <fpage>27</fpage>
          <pub-id pub-id-type="doi">10.1007/s10916-015-0224-4</pub-id>
          <pub-id pub-id-type="medline">25666928</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Win</surname>
              <given-names>KT</given-names>
            </name>
            <name name-style="western">
              <surname>Hassan</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Oinas-Kukkonen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Probst</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Online patient education for chronic disease management: consumer perspectives</article-title>
          <source>J Med Syst</source>
          <year>2016</year>
          <month>04</month>
          <volume>40</volume>
          <issue>4</issue>
          <fpage>88</fpage>
          <pub-id pub-id-type="doi">10.1007/s10916-016-0438-0</pub-id>
          <pub-id pub-id-type="medline">26846749</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10916-016-0438-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kanthawala</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Vermeesch</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Given</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Huh</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Answers to health questions: internet search results versus online health community responses</article-title>
          <source>J Med Internet Res</source>
          <year>2016</year>
          <month>04</month>
          <day>28</day>
          <volume>18</volume>
          <issue>4</issue>
          <fpage>e95</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmir.org/2016/4/e95/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.5369</pub-id>
          <pub-id pub-id-type="medline">27125622</pub-id>
          <pub-id pub-id-type="pii">v18i4e95</pub-id>
          <pub-id pub-id-type="pmcid">PMC4865652</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hinz</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>The health information seeking and usage behavior intention of Chinese consumers through mobile phones</article-title>
          <source>Info Technol People</source>
          <year>2015</year>
          <month>06</month>
          <volume>28</volume>
          <issue>2</issue>
          <fpage>405</fpage>
          <lpage>423</lpage>
          <pub-id pub-id-type="doi">10.1108/ITP-03-2014-0053</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arsenault</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Blouin</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Guitton</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Information quality and dynamics of patients' interactions on tonsillectomy web resources</article-title>
          <source>Internet Interv</source>
          <year>2016</year>
          <month>05</month>
          <volume>4</volume>
          <fpage>99</fpage>
          <lpage>104</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2214-7829(15)30025-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.invent.2016.05.002</pub-id>
          <pub-id pub-id-type="medline">30135795</pub-id>
          <pub-id pub-id-type="pii">S2214-7829(15)30025-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC6096116</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beaunoyer</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Arsenault</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lomanowska</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Guitton</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Understanding online health information: evaluation, tools, and strategies</article-title>
          <source>Patient Educ Couns</source>
          <year>2017</year>
          <month>02</month>
          <volume>100</volume>
          <issue>2</issue>
          <fpage>183</fpage>
          <lpage>189</lpage>
          <pub-id pub-id-type="doi">10.1016/j.pec.2016.08.028</pub-id>
          <pub-id pub-id-type="medline">27595436</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(16)30402-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>LMS</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>Online health information seeking: the influence of age, information trustworthiness, and search challenges</article-title>
          <source>J Aging Health</source>
          <year>2012</year>
          <month>04</month>
          <volume>24</volume>
          <issue>3</issue>
          <fpage>525</fpage>
          <lpage>541</lpage>
          <pub-id pub-id-type="doi">10.1177/0898264311428167</pub-id>
          <pub-id pub-id-type="medline">22187092</pub-id>
          <pub-id pub-id-type="pii">0898264311428167</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Health information in the digital age: an empirical study of the perceived benefits and costs of seeking and using health information from online sources</article-title>
          <source>Health Info Libr J</source>
          <year>2019</year>
          <month>06</month>
          <volume>36</volume>
          <issue>2</issue>
          <fpage>153</fpage>
          <lpage>167</lpage>
          <pub-id pub-id-type="doi">10.1111/hir.12250</pub-id>
          <pub-id pub-id-type="medline">30737878</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kandula</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Curtis</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng-Treitler</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Use of topic modeling for recommending relevant education material to diabetic patients</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2011</year>
          <volume>2011</volume>
          <fpage>674</fpage>
          <lpage>682</lpage>
          <pub-id pub-id-type="medline">22195123</pub-id>
          <pub-id pub-id-type="pmcid">PMC3243223</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>YL</given-names>
            </name>
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Shiu</surname>
              <given-names>YS</given-names>
            </name>
          </person-group>
          <article-title>Design and evaluation of a cloud-based Mobile Health Information Recommendation system on wireless sensor networks</article-title>
          <source>Comput Electr Eng</source>
          <year>2016</year>
          <month>01</month>
          <volume>49</volume>
          <fpage>221</fpage>
          <lpage>235</lpage>
          <pub-id pub-id-type="doi">10.1016/j.compeleceng.2015.07.017</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wiesner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pfeifer</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Health recommender systems: concepts, requirements, technical basics and challenges</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2014</year>
          <month>03</month>
          <volume>11</volume>
          <issue>3</issue>
          <fpage>2580</fpage>
          <lpage>2607</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.mdpi.com/resolver?pii=ijerph110302580"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph110302580</pub-id>
          <pub-id pub-id-type="medline">24595212</pub-id>
          <pub-id pub-id-type="pii">ijerph110302580</pub-id>
          <pub-id pub-id-type="pmcid">PMC3968965</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agapito</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Simeoni</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Calabrese</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Caré</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Lamprinoudi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Guzzi</surname>
              <given-names>PH</given-names>
            </name>
            <name name-style="western">
              <surname>Pujia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fuiano</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cannataro</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>DIETOS: A dietary recommender system for chronic diseases monitoring and management</article-title>
          <source>Comput Methods Programs Biomed</source>
          <year>2018</year>
          <month>01</month>
          <volume>153</volume>
          <fpage>93</fpage>
          <lpage>104</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cmpb.2017.10.014</pub-id>
          <pub-id pub-id-type="medline">29157465</pub-id>
          <pub-id pub-id-type="pii">S0169-2607(16)30692-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>iDoctor: personalized and professionalized medical recommendations based on hybrid matrix factorization</article-title>
          <source>Futur Gener Comput Syst</source>
          <year>2017</year>
          <month>01</month>
          <volume>66</volume>
          <fpage>30</fpage>
          <lpage>35</lpage>
          <pub-id pub-id-type="doi">10.1016/j.future.2015.12.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rivero-Rodriguez</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Konstantinidis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sanchez-Bocanegra</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fernandez-Luque</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>A health information recommender systemnriching YouTube health videos with Medline Plus information by the use of SnomedCT terms</article-title>
          <source>Proc 26th IEEE Int Symp Comput Based Med Syst</source>
          <year>2013</year>
          <pub-id pub-id-type="doi">10.1109/cbms.2013.6627798</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Manogaran</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Varatharajan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Priyan</surname>
              <given-names>MK</given-names>
            </name>
          </person-group>
          <article-title>Hybrid recommendation system for heart disease diagnosis based on multiple kernel learning with adaptive neuro-fuzzy inference system</article-title>
          <source>Multimed Tools Appl</source>
          <year>2017</year>
          <month>12</month>
          <day>22</day>
          <volume>77</volume>
          <issue>4</issue>
          <fpage>4379</fpage>
          <lpage>4399</lpage>
          <pub-id pub-id-type="doi">10.1007/s11042-017-5515-y</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pincay</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Teran</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Portmann</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Health recommender systems: a state-of-the-art review</article-title>
          <year>2019</year>
          <conf-name>2019 Sixth International Conference on eDemocracy &#38; eGovernment (ICEDEG)</conf-name>
          <conf-date>2019</conf-date>
          <conf-loc>Quito</conf-loc>
          <fpage>47</fpage>
          <lpage>55</lpage>
          <pub-id pub-id-type="doi">10.1109/icedeg.2019.8734362</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Recommender system application developments: a survey</article-title>
          <source>Decis Support Syst</source>
          <year>2015</year>
          <month>06</month>
          <volume>74</volume>
          <fpage>12</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.1016/j.dss.2015.03.008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Burke</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Hybrid web recommender systems</article-title>
          <source>The Adaptive Web</source>
          <year>2007</year>
          <publisher-loc>Springer</publisher-loc>
          <publisher-name>Berlin</publisher-name>
          <fpage>377</fpage>
          <lpage>408</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ricci</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Rokach</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Shapira</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Introduction to recommender systems handbook</article-title>
          <source>Recommender Systems Handbook</source>
          <year>2011</year>
          <publisher-loc>Springer</publisher-loc>
          <publisher-name>Boston</publisher-name>
          <fpage>1</fpage>
          <lpage>35</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pazzani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Billsus</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Content-based recommendation systems</article-title>
          <source>The Adaptive Web</source>
          <year>2007</year>
          <publisher-loc>Springer</publisher-loc>
          <publisher-name>Berlin</publisher-name>
          <fpage>325</fpage>
          <lpage>341</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Colombo-Mendoza</surname>
              <given-names>LO</given-names>
            </name>
            <name name-style="western">
              <surname>Valencia-García</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rodríguez-González</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alor-Hernández</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Samper-Zapater</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>RecomMetz: a context-aware knowledge-based mobile recommender system for movie showtimes</article-title>
          <source>Expert Syst Appl</source>
          <year>2015</year>
          <month>02</month>
          <volume>42</volume>
          <issue>3</issue>
          <fpage>1202</fpage>
          <lpage>1222</lpage>
          <pub-id pub-id-type="doi">10.1016/j.eswa.2014.09.016</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shishehchi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Banihashem</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mat</surname>
              <given-names>ZN</given-names>
            </name>
            <name name-style="western">
              <surname>Noah</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Ontological approach in knowledge based recommender system to develop the quality of e-learning system</article-title>
          <source>Aust J Basic Appl Sci</source>
          <year>2012</year>
          <volume>6</volume>
          <issue>2</issue>
          <fpage>115</fpage>
          <lpage>123</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Buder</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schwind</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Learning with personalized recommender systems: a psychological view</article-title>
          <source>Comput Human Behav</source>
          <year>2012</year>
          <month>1</month>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>207</fpage>
          <lpage>216</lpage>
          <pub-id pub-id-type="doi">10.1016/j.chb.2011.09.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tarus</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Niu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Mustafa</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Knowledge-based recommendation: a review of ontology-based recommender systems for e-learning</article-title>
          <source>Artif Intell Rev</source>
          <year>2017</year>
          <month>1</month>
          <day>13</day>
          <volume>50</volume>
          <issue>1</issue>
          <fpage>21</fpage>
          <lpage>48</lpage>
          <pub-id pub-id-type="doi">10.1007/s10462-017-9539-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adomavicius</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Tuzhilin</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Toward the next generation of recommender systems: a survey of the state-of-the-art and possible extensions</article-title>
          <source>IEEE Trans Knowl Data Eng</source>
          <year>2005</year>
          <month>06</month>
          <volume>17</volume>
          <issue>6</issue>
          <fpage>734</fpage>
          <lpage>749</lpage>
          <pub-id pub-id-type="doi">10.1109/tkde.2005.99</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rastegar-Mojarad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Recommending education materials for diabetic questions using information retrieval approaches</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>10</month>
          <day>16</day>
          <volume>19</volume>
          <issue>10</issue>
          <fpage>e342</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2017/10/e342/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.7754</pub-id>
          <pub-id pub-id-type="medline">29038097</pub-id>
          <pub-id pub-id-type="pii">v19i10e342</pub-id>
          <pub-id pub-id-type="pmcid">PMC5662791</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sanchez Bocanegra</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Sevillano Ramos</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Rizo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Civit</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fernandez-Luque</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>HealthRecSys: a semantic content-based recommender system to complement health videos</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2017</year>
          <month>5</month>
          <day>15</day>
          <volume>17</volume>
          <issue>1</issue>
          <pub-id pub-id-type="doi">10.1186/s12911-017-0431-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Duan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Chi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>An</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Using goal-directed design to create a mobile health app to improve patient compliance with hypertension self-management: development and deployment</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2020</year>
          <month>02</month>
          <day>25</day>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>e14466</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mhealth.jmir.org/2020/2/e14466/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/14466</pub-id>
          <pub-id pub-id-type="medline">32130161</pub-id>
          <pub-id pub-id-type="pii">v8i2e14466</pub-id>
          <pub-id pub-id-type="pmcid">PMC7064970</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dou</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Guan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Duan</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Patients' acceptance of smartphone health technology for chronic disease management: a theoretical model and empirical test</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2017</year>
          <month>12</month>
          <day>06</day>
          <volume>5</volume>
          <issue>12</issue>
          <fpage>e177</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://mhealth.jmir.org/2017/12/e177/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/mhealth.7886</pub-id>
          <pub-id pub-id-type="medline">29212629</pub-id>
          <pub-id pub-id-type="pii">v5i12e177</pub-id>
          <pub-id pub-id-type="pmcid">PMC5738544</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Noy</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>McGuinness</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <source>Stanford Knowl Syst Lab</source>
          <year>2001</year>
          <access-date>2020-04-08</access-date>
          <comment>Ontology development 101: a guide to creating your first ontology<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.ksl.stanford.edu/people/dlm/papers/ontology-tutorial-noy-mcguinness.pdf">http://www.ksl.stanford.edu/people/dlm/papers/ontology-tutorial-noy-mcguinness.pdf</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Grüninger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fox</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Methodology for the design and evaluation of ontologies</article-title>
          <year>1995</year>
          <conf-name>Int Jt Conf Artif Intel (IJCAI95), Work Basic Ontol Issues Knowl Shar</conf-name>
          <conf-date>1995</conf-date>
          <conf-loc>Montreal</conf-loc>
          <fpage>1</fpage>
          <lpage>10</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Horrocks</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Patel-Schneider</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Boley</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tabet</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Grosof</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>SWRL: a semantic web rule language combining OWL and RuleML</source>
          <year>2004</year>
          <access-date>2020-04-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.w3.org/Submission/SWRL/">https://www.w3.org/Submission/SWRL/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Salton</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Buckley</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Term-weighting approaches in automatic text retrieval</article-title>
          <source>Inf Process Manag</source>
          <year>1988</year>
          <month>1</month>
          <volume>24</volume>
          <issue>5</issue>
          <fpage>513</fpage>
          <lpage>523</lpage>
          <pub-id pub-id-type="doi">10.1016/0306-4573(88)90021-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mihalcea</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tarau</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>TextRank: bringing order into texts</article-title>
          <year>2004</year>
          <conf-name>Proceedings of the 2004 Conference on Empirical Methods in Natural Language</conf-name>
          <conf-date>2004</conf-date>
          <conf-loc>Barcelona</conf-loc>
          <fpage>404</fpage>
          <lpage>411</lpage>
          <pub-id pub-id-type="doi">10.1016/0305-0491(73)90144-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <source>Efficient estimation of word representations in vector space</source>
          <year>2013</year>
          <access-date>2020-04-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1301.3781">http://arxiv.org/abs/1301.3781</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <source>Advances in Neural Information Processing Systems</source>
          <year>2013</year>
          <access-date>2020-04-08</access-date>
          <comment>Distributed representations of words and phrases and their compositionality<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1310.4546">https://arxiv.org/abs/1310.4546</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <source>Source code of the recommendation algorithm</source>
          <year>2019</year>
          <access-date>2020-04-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/xxwywzy/personalized-health-education">https://github.com/xxwywzy/personalized-health-education</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Radim</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sojka</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Software framework for topic modelling with large corpora</article-title>
          <year>2010</year>
          <conf-name>Proceedings of LREC 2010 workshop New Challenges for NLP Frameworks</conf-name>
          <conf-date>2010</conf-date>
          <conf-loc>Malta</conf-loc>
          <fpage>45</fpage>
          <lpage>50</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://is.muni.cz/publication/884893/en/Software-Framework-for-Topic-Modelling-with-Large-Corpora/Rehurek-Sojka"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lamy</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Owlready: ontology-oriented programming in Python with automatic classification and high level constructs for biomedical ontologies</article-title>
          <source>Artif Intell Med</source>
          <year>2017</year>
          <month>07</month>
          <volume>80</volume>
          <fpage>11</fpage>
          <lpage>28</lpage>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2017.07.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kroenke</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Spitzer</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>JB</given-names>
            </name>
          </person-group>
          <article-title>The PHQ-9: validity of a brief depression severity measure</article-title>
          <source>J Gen Intern Med</source>
          <year>2001</year>
          <month>09</month>
          <volume>16</volume>
          <issue>9</issue>
          <fpage>606</fpage>
          <lpage>613</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/resolve/openurl?genre=article&#38;sid=nlm:pubmed&#38;issn=0884-8734&#38;date=2001&#38;volume=16&#38;issue=9&#38;spage=606"/>
          </comment>
          <pub-id pub-id-type="doi">10.1046/j.1525-1497.2001.016009606.x</pub-id>
          <pub-id pub-id-type="medline">11556941</pub-id>
          <pub-id pub-id-type="pii">jgi01114</pub-id>
          <pub-id pub-id-type="pmcid">PMC1495268</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Craig</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Marshall</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Sjöström</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bauman</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Booth</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Ainsworth</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Pratt</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ekelund</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Yngve</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sallis</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Oja</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>International physical activity questionnaire: 12-country reliability and validity</article-title>
          <source>Med Sci Sports Exerc</source>
          <year>2003</year>
          <month>08</month>
          <volume>35</volume>
          <issue>8</issue>
          <fpage>1381</fpage>
          <lpage>1395</lpage>
          <pub-id pub-id-type="doi">10.1249/01.MSS.0000078924.61453.FB</pub-id>
          <pub-id pub-id-type="medline">12900694</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <source>BioPortal: chronic disease patient education ontology</source>
          <access-date>2020-04-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://bioportal.bioontology.org/ontologies/CDPEO">http://bioportal.bioontology.org/ontologies/CDPEO</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pearson</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>On lines and planes of closest fit to systems of points in space</article-title>
          <source>London Edinburgh Dublin Philos Mag J Sci</source>
          <year>1901</year>
          <volume>2</volume>
          <issue>11</issue>
          <fpage>559</fpage>
          <lpage>572</lpage>
          <pub-id pub-id-type="doi">10.1080/14786440109462720</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hotelling</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Analysis of a complex of statistical variables into principal components</article-title>
          <source>J Educ Psychol</source>
          <year>1933</year>
          <volume>24</volume>
          <issue>7</issue>
          <fpage>498</fpage>
          <lpage>520</lpage>
          <pub-id pub-id-type="doi">10.1037/h0070888</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Booth</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Haas</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>McCabe</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <source>W3C Working Group Note: web services architecture</source>
          <year>2004</year>
          <access-date>2020-04-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.w3.org/TR/2004/NOTE-ws-arch-20040211">https://www.w3.org/TR/2004/NOTE-ws-arch-20040211</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Keyword extraction based on tf/idf for Chinese news document</article-title>
          <source>Wuhan Univ J of Nat Sci</source>
          <year>2007</year>
          <month>9</month>
          <volume>12</volume>
          <issue>5</issue>
          <fpage>917</fpage>
          <lpage>921</lpage>
          <pub-id pub-id-type="doi">10.1007/s11859-007-0038-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>MY</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>A hybrid keyword extraction method based on TF and semantic strategies for Chinese document</article-title>
          <source>Appl Mech Mater</source>
          <year>2014</year>
          <month>9</month>
          <volume>635-637</volume>
          <fpage>1476</fpage>
          <lpage>1479</lpage>
          <pub-id pub-id-type="doi">10.4028/www.scientific.net/amm.635-637.1476</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Chinese document keyword extraction algorithm based on FP-growth</article-title>
          <year>2016</year>
          <conf-name>International Conference on Smart City and Systems Engineering (ICSCSE). IEEE</conf-name>
          <conf-date>2016</conf-date>
          <conf-loc>Hunan</conf-loc>
          <fpage>202</fpage>
          <lpage>205</lpage>
          <pub-id pub-id-type="doi">10.1109/icscse.2016.0062</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <source>BERT: pre-training of deep bidirectional transformers for language understanding</source>
          <year>2018</year>
          <access-date>2020-04-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1810.04805">http://arxiv.org/abs/1810.04805</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Carbonell</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Salakhutdinov</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <source>XLNet: generalized autoregressive pretraining for language understanding</source>
          <year>2019</year>
          <access-date>2020-04-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1906.08237">http://arxiv.org/abs/1906.08237</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
