<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i7e16312</article-id>
      <article-id pub-id-type="pmid">32209527</article-id>
      <article-id pub-id-type="doi">10.2196/16312</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A Multiview Model for Detecting the Inappropriate Use of Prescription Medication: Machine Learning Approach</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Yang</surname>
            <given-names>Zhirong</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Aminbeidokhti</surname>
            <given-names>Amirhossein</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Zhuo</surname>
            <given-names>Lin</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9188-702X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Cheng</surname>
            <given-names>Yinchu</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6084-0384</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Shaoqin</given-names>
          </name>
          <degrees>BA</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8144-9042</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>Yu</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5611-8951</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Tang</surname>
            <given-names>Shuang</given-names>
          </name>
          <degrees>BA</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2186-7503</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Zhen</surname>
            <given-names>Jiancun</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7402-2865</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>Junfeng</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1268-5006</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Zhan</surname>
            <given-names>Siyan</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Research Center of Clinical Epidemiology</institution>
            <institution>Peking University Third Hospital</institution>
            <addr-line>49 North Garden Rd, Haidian District</addr-line>
            <addr-line>Beijing, 100191</addr-line>
            <country>China</country>
            <phone>86 1082805162</phone>
            <email>siyan-zhan@bjmu.edu.cn</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7252-5349</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Research Center of Clinical Epidemiology</institution>
        <institution>Peking University Third Hospital</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Epidemiology and Biostatistics</institution>
        <institution>School of Public Health</institution>
        <institution>Peking University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Pharmacy</institution>
        <institution>Peking University Third Hospital</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>School of Electronics Engineering and Computer Science</institution>
        <institution>Peking University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Center for Data Science in Medicine and Health</institution>
        <institution>Peking University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Department of Pharmacy</institution>
        <institution>Ji Shui Tan Hospital and Fourth Medical College of Peking University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Siyan Zhan <email>siyan-zhan@bjmu.edu.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>7</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>6</day>
        <month>7</month>
        <year>2020</year>
      </pub-date>
      <volume>8</volume>
      <issue>7</issue>
      <elocation-id>e16312</elocation-id>
      <history>
        <date date-type="received">
          <day>18</day>
          <month>9</month>
          <year>2019</year>
        </date>
        <date date-type="rev-request">
          <day>25</day>
          <month>11</month>
          <year>2019</year>
        </date>
        <date date-type="rev-recd">
          <day>18</day>
          <month>1</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>24</day>
          <month>3</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Lin Zhuo, Yinchu Cheng, Shaoqin Liu, Yu Yang, Shuang Tang, Jiancun Zhen, Junfeng Zhao, Siyan Zhan. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 06.07.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2020/7/e16312" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The inappropriate use of prescription medication has recently garnered worldwide attention, but most national policies do not effectively provide for early detection or timely intervention.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to develop and assess the validity of a model that can detect the inappropriate use of prescription medication. This effort combines a multiview and topic matching method. The study also assessed the validity of this approach.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>A multiview extension of the latent Dirichlet allocation algorithm for topic modeling was chosen to generate diagnosis-medication topics, with data obtained from the Chinese Monitoring Network for Rational Use of Drugs (CMNRUD) database. Topic mapping allowed for calculating the degree to which diagnoses and medications were similarly distributed and, by setting a threshold, for identifying prescription misuse. The Beijing Regional Prescription Review Database (BRPRD) database was used as the gold standard to assess the model’s validity. We also conducted a sensitivity analysis using random samples of validated prescriptions and evaluated the model’s performance.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>A total of 44 million prescriptions were used to generate topics using the diagnoses and medications from the CMNRUD database. A random sample (15,000 prescriptions) from the BRPRD was used for validation, and it was found that the model had a sensitivity of 81.8%, specificity of 47.4%, positive-predictive value of 14.5%, and negative-predictive value of 96.0%. The model showed superior stability under different sampling proportions.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>A method that combines multiview topic modeling and topic matching can detect the inappropriate use of prescription medication. This model, which has mediocre specificity and moderate sensitivity, can be used as a primary screening tool and will likely complement and improve the process of manually reviewing prescriptions.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>inappropriate use of prescription medication</kwd>
        <kwd>topic model</kwd>
        <kwd>latent Dirichlet allocation</kwd>
        <kwd>multiview learning</kwd>
        <kwd>prescription review</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>It is estimated that more than 50% of medicines are inappropriately prescribed, dispensed, or sold, which represents a universal challenge for medical practice [<xref ref-type="bibr" rid="ref1">1</xref>]. Furthermore, in developing countries, the treatment of about 60% to 70% of patients in primary care does not meet standard treatment guidelines [<xref ref-type="bibr" rid="ref2">2</xref>]. This inappropriate use of prescription is wasteful and costly, and can increase the risk of adverse drug reactions [<xref ref-type="bibr" rid="ref3">3</xref>]. Finally, the overuse of antimicrobial and antibiotic injections may result in certain pathogens developing antibiotic resistance [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
      <p>The excessive use of antibiotics is common in China, as is the injection of traditional Chinese medicines [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. Antibiotics are present in 50% of prescriptions and injectable medicines in 30%, exceeding the World Health Organization’s standard treatment guidelines [<xref ref-type="bibr" rid="ref7">7</xref>]. The Chinese government released the <italic>Management Practices of Hospital Prescription Comment (Trial)</italic> in 2010 to assess compliance with rational criteria for using prescription drugs [<xref ref-type="bibr" rid="ref8">8</xref>]. This document requires that each hospital assign trained pharmacists monthly to review a minimum of 100 randomly sampled prescriptions. However, these reviews are currently associated with limited coverage, high omission rates, a lack of representativeness, and supervisory lag. All of this points to the urgency of improving the review process, especially when Chinese hospitals are witnessing a continuous daily increase in outpatient prescriptions [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>].</p>
      <p>A few knowledge-based approaches have been implemented in the health care information systems (HISs) of Chinese hospitals to screen the appropriateness of prescriptions [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. Prior knowledge, including treatment guidelines, formularies, package inserts, expert knowledge, and published literature, indicates that these systems are generally working well. However, they are time-consuming and costly to establish and maintain [<xref ref-type="bibr" rid="ref13">13</xref>]. Furthermore, timely updates to these systems are challenging because of the continuous availability of both new drugs and new research.</p>
      <p>Currently, both supervised and unsupervised data-driven methodologies, whether as alternatives or supplements to the systems listed above, are being used to identify outliers and detect inappropriate prescriptions. Such approaches remain constrained, however, by the difficulty associated with using supervised methods to obtain high-quality labeled sample data [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. Other limiting factors include defining outliers and considering their association rules, which effectively account for the relationships between features [<xref ref-type="bibr" rid="ref16">16</xref>]. Usually, diagnosis and medication are closely and consistently related to the clinical condition of the patient. In the absence of this consistency, prescriptions are more likely to be inappropriate (or anomalous). Contextual anomaly detection is one approach to capture the relationship between features (eg, between medication and diagnosis) and to detect exceptions caused by feature mismatch [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Nonetheless, this does not work well with prescription data or similar information in a high-dimensional sparse space [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
      <p>By contrast, a topic modeling method, the latent Dirichlet allocation (LDA) method [<xref ref-type="bibr" rid="ref20">20</xref>], has been proven to be useful in dimensional reduction when mining patient records [<xref ref-type="bibr" rid="ref21">21</xref>]. Here, a “topic” is defined as a collection of semantically related terms that appear frequently and relate to a common subject [<xref ref-type="bibr" rid="ref22">22</xref>]. LDA, a probabilistic statistical model with the assumption that topic distributions are drawn from their prior distributions, can be used to describe the composition of high-dimensional unstructured text and to capture clusters of words that reveal critical concepts [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. Beginning with its appearance in the biomedical domain, LDA has been used in mining clinical pathway patterns [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>], image processing [<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref29">29</xref>], risk stratification [<xref ref-type="bibr" rid="ref30">30</xref>], and bioinformatics [<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref33">33</xref>]. One drawback of LDA is that it cannot simultaneously consider both diagnosis and medication. We therefore adopted a multiview [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref34">34</xref>-<xref ref-type="bibr" rid="ref36">36</xref>] concept that enhances the topic modeling capacity of LDA and coordinated it with anomaly detection techniques to build a multiview LDA model (MV-LDA). This model, which was tested in our previous simulation study, had a greater area under the precision-recall curve [<xref ref-type="bibr" rid="ref37">37</xref>] than the two traditional methods (point anomaly detection and contextual anomaly detection) and had better suitability for high-dimensional sparse data.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Sources</title>
        <p>One subsystem of the Chinese Monitoring Network for the Rational Use of Drugs (CMNRUD) was the data source for model development. The CMNRUD was launched by the Chinese Ministry of Health in 2010, and it covers over 86% (30/35) of the provinces in China [<xref ref-type="bibr" rid="ref38">38</xref>], including 60% of the nation’s tertiary hospitals (955 hospitals) and 6% of its secondary hospitals (375 hospitals) [<xref ref-type="bibr" rid="ref39">39</xref>]. Each monitoring hospital must upload encrypted data every month. The system organizes the prescriptions in a stipulated uniform structure, and thereafter, some of the cleaned data are checked by data management professionals. Since 2013, the system has been performing automatic uploading, preliminary cleaning, recoding, and verification.</p>
        <p>The CMNRUD consists of the following four monitoring subsystems: outpatient prescriptions, clinical drug use, medical damage, and critical disease. Anonymized data from outpatient prescriptions (from October to December 2016) were used to build the model for detecting prescription misuse. These data include demographic, diagnostic, and drug-related information. Diagnostic information includes the patient ID, diagnosis date, diagnosis description, and diagnostic code (10th revision of the International Classification of Diseases, ICD-10), which are directly related to the purpose of the patient’s visit or their condition. It sometimes may not include other complications that do not require further treatment. A higher diagnosis ranking was associated with more visit relevance. Available drug-related information (no more than five medications per prescription) includes information such as the prescription date, generic and brand names, corresponding Anatomical Therapeutic Chemical code, dosage, and administration route. The medications were listed randomly, preventing them from being mapped to the corresponding diagnoses on a one-to-one basis. The variables taken from the CMNRUD are presented in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <p>The data for model validation were randomly selected from the Beijing Regional Prescription Review Database (BRPRD) [<xref ref-type="bibr" rid="ref40">40</xref>], which was created by the Beijing Municipal Administration of Hospitals in 2010. The BRPRD extracts 1 week of prescriptions every quarter from the HISs of 17 tertiary hospitals and five secondary hospitals in Beijing. A total of 19 hospitals from the BRPRD were included among the 65 CMNRUD monitoring hospitals from Beijing and accounted for 5.4% (19/349) of the hospitals in the entire CMNRUD database. The prescription variables include treatment type, prescription number, prescription date, age, sex, diagnosis, and medication. As part of the standard procedure, a prescription review board of trained clinicians and clinical pharmacists regularly examines the prescriptions individually based on a standardized guideline and then captures inappropriate data in the BRPRD database [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref41">41</xref>].</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Main variables in the Chinese Monitoring Network for the Rational Use of Drugs outpatient prescription monitoring subsystem.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="250"/>
            <col width="750"/>
            <thead>
              <tr valign="top">
                <td>Information</td>
                <td>Variables<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Basic information<break/>(patients)</td>
                <td>Patient ID, treatment card number, sex, age, and age range</td>
              </tr>
              <tr valign="top">
                <td>Basic information<break/>(hospital, department, and doctor)</td>
                <td>Hospital name, hospital grade, hospital type, region, department, and doctor ID</td>
              </tr>
              <tr valign="top">
                <td>Diagnosis</td>
                <td>Diagnosis name, and ICD-10<sup>b</sup> by class, suborder, and type</td>
              </tr>
              <tr valign="top">
                <td>Medication<sup>c</sup></td>
                <td>Prescription ID, prescription type, prescription date, ATC<sup>d</sup> code, drug trade name, drug generic name, specification, quantity, unit, dosage, usage, price, pharmaceutical company, and individual hospital information</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>The variables indicate the features of the multiview latent Dirichlet allocation model.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>ICD-10: 10th revision of the International Classification of Diseases.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>Since a generic medicine works the same as its branded version and owing to the limitation of the Anatomical Therapeutic Chemical’s lack of codes for traditional Chinese medicine, we used generic names, which are well recorded in the database, to build the topic model.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>ATC: Anatomical Therapeutic Chemical.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Study Approval</title>
        <p>The Institutional Review Board of Peking University reviewed and approved the study protocol before the study commenced, and it determined that informed consent was not required (reference number: IRB00001052-17003-Exempt).</p>
      </sec>
      <sec>
        <title>Study Design</title>
        <p>We developed and evaluated an MV-LDA model for detecting the inappropriate use of prescription medications in the following four steps: (1) data preparation, gathering and cleaning data from the CMNRUD and BRPRD database; (2) topic generation, using MV-LDA topic-modeling methods and CMNRUD data to extract associations between diagnoses and medications; (3) inferring and anomaly scoring, using BRPRD data and the topics extracted in step 2 to infer the distribution of each prescription and measuring the degree to which diagnoses and medications show similar distributions (less similarity is associated with more likelihood that the item represents the inappropriate use of prescription medication); (4) model evaluation and sensitivity analysis, evaluating the model for detecting prescription misuse with the results of the BRPRD review.</p>
        <sec>
          <title>Step 1: Data Preparation</title>
          <p>Prescriptions between October 2016 and December 2016 from CMNRUD were used, and those with missing prescription identifiers or with medication withdrawal were excluded. The patient ID, treatment card number, prescription date, diagnosis name, and generic drug name were chosen to build the topics.</p>
          <p>For model evaluation, considering the sensitivity and specificity (71.5% and 68.8%, respectively) of the Apriori algorithm in previous work [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>], we set both the expected sensitivity and specificity at 80%. By setting a significance level of .05 and an allowable error of 0.05, we needed at least 14,471 prescriptions given 1.7% prevalence [<xref ref-type="bibr" rid="ref44">44</xref>] of prescription misuse according to equation 1.</p>
          <p>
            <graphic xlink:href="medinform_v8i7e16312_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>Finally, we randomly selected a total of 15,000 prescriptions from 2016 BRPRD data that had already been manually reviewed by experienced pharmacists, with the prescriptions that included the following three variables: prescription ID, diagnosis, and medication.</p>
        </sec>
        <sec>
          <title>Step 2: Topic Generation</title>
          <p>The study is based on the assumption that the prescription database is mostly composed of regular instances (ie, rational appropriate prescriptions), and a probabilistic model is fitted to all features.</p>
          <p>LDA assumes that a set of documents or instances exhibits a specific number of latent independent topics, and then, the given topics generate the terms probabilistically. A graphical representation of the LDA model is given in <xref rid="figure1" ref-type="fig">Figure 1</xref>. With specific input records and setting hyperparameters <italic>α</italic> and <italic>β</italic>, LDA can detect <italic>K</italic> topics, formally presented as two multinomial distributions (topic-word distribution <italic>φ</italic> and document-topic distribution <italic>θ</italic>). The LDA model formula is shown in equation 2.</p>
          <p>
            <graphic xlink:href="medinform_v8i7e16312_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>Like the standard LDA, MV-LDA can be represented as a probability pattern, as shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>. In the medical domain, we can consider a clinical condition (topic) as a probability distribution over related diagnostic codes, and a patient’s diagnostic record can be regarded as a “document” composed of different clinical topics. The same applies to medication. In our study, we used CMNRUD data to generate MV-LDA topics. For prescription <italic>m</italic>, features A and B represent the diagnoses and medications, respectively. Both follow the same generative process mentioned above (ie, they comply with the same topic distribution <italic>θ</italic>), and then, <italic>α</italic> and <italic>β</italic> become the hyperparameters of prescription-topic distribution and topic-diagnosis (or topic-medication) distribution within topics. Moreover, <italic>φ<sup>A</sup></italic> and <italic>φ<sup>B</sup></italic> represent the topic feature distribution of A and B, respectively. In summary, the MV-LDA model is a combination of two separate LDA models (here they are called <italic>f<sup>A</sup></italic> and <italic>f<sup>B</sup></italic>) integrated by the common distribution <italic>θ</italic>. In <xref rid="figure2" ref-type="fig">Figure 2</xref>, <italic>N<sup>A</sup></italic> and <italic>N<sup>B</sup></italic> are the total numbers of diagnoses and medications with each prescription; this value can only be a discrete integer.</p>
          <fig id="figure1" position="float">
            <label>Figure 1</label>
            <caption>
              <p>Graphical representation of the latent Dirichlet allocation model. K: number of topics; M: number of documents; N: number of words in each document; x: observed words in the document m; z: topic of nth word in a document m; θ: topic distribution for document m (document-topic distribution); φ: topic-word distribution; α: hyperparameter of θ; β: hyperparameter of φ.</p>
            </caption>
            <graphic xlink:href="medinform_v8i7e16312_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Graphical representation of the multiview latent Dirichlet allocation model. K: number of topics; M: number of prescriptions; N<sup>A</sup>: number of diagnoses per prescription; N<sup>B</sup>: number of medications per prescription; x<sup>A</sup>: diagnosis (type A feature); x<sup>B</sup>: medication (type B feature); z<sup>A</sup>: topic of x<sup>A</sup>; z<sup>B</sup>: topic of x<sup>B</sup>; φ<sup>A</sup>: topic-diagnosis distribution; φ<sup>B</sup>: topic-medication distribution; β<sup>A</sup>: hyperparameter of φ<sup>A</sup>; β<sup>B</sup>: hyperparameter of φ<sup>B</sup>; θ: prescription-topic distribution; α: hyperparameter of θ.</p>
            </caption>
            <graphic xlink:href="medinform_v8i7e16312_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <p>The MV-LDA model generates topics as follows: (1) For each topic, draw features <italic>φ<sup>A</sup></italic>~<italic>Dirichlet(β<sup>A</sup>)</italic> and draw features <italic>φ<sup>B</sup></italic>~<italic>Dirichlet(β<sup>B</sup>)</italic>; (2) For each prescription, draw topic proportions <italic>θ~Dirichlet(α)</italic>; for each feature A, draw <italic>z<sub>m,n</sub>~Mult(θ<sub>m</sub>)</italic> and draw <italic>x<sub>m,n</sub>~Mult(φ<sub>z</sub><sup>A</sup>)</italic>; and for each feature B, repeat the steps for feature A.</p>
          <p>We adopted Gibbs sampling to create the model and parameters <italic>φ</italic> and <italic>θ</italic>. Topics were first randomly assigned to all of the features. Every diagnosis (type A feature) or medication (type B feature) in each prescription that corresponds to a topic is iteratively sampled. The calculation of the conditional probability of <italic>x<sup>A</sup></italic> is shown in equation 3, with the related notations shown in <xref ref-type="table" rid="table2">Table 2</xref>. Here, the first factor of equation 3 only accounts for the type A feature topic-diagnosis counts, whereas the second factor calculates the prescription-topic for all features. This formula also applies to type B features.</p>
          <p>The features of both types (A and B) were iteratively sampled for each prescription until the model converged. Thereafter, we utilized the result to calculate the parameters <italic>φ<sup>A</sup></italic> and <italic>φ<sup>B</sup></italic>, which are used for the inferring step, and <italic>φ<sup>A</sup></italic> can be calculated as in equation 4. We set eight topic numbers (15, 20, 25, 30, 35, 40, 45, and 50) and built the MV-LDA model according to previous research and a pilot study revealing that LDA had a moderate ability in terms of generating topics for electronic medical records with a topic number of around 30 [<xref ref-type="bibr" rid="ref45">45</xref>].</p>
          <p>
            <graphic xlink:href="medinform_v8i7e16312_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>
            <graphic xlink:href="medinform_v8i7e16312_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Notations of the multiview latent Dirichlet allocation model in Gibbs sampling.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="200"/>
              <col width="800"/>
              <thead>
                <tr valign="top">
                  <td>Variable</td>
                  <td>Description</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>
                    <italic>K</italic>
                  </td>
                  <td>Topic number</td>
                </tr>
                <tr valign="top">
                  <td>
                    <italic>V</italic>
                    <sup>A</sup>
                  </td>
                  <td>Number of diagnoses (type A feature)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <graphic xlink:href="medinform_v8i7e16312_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
                  </td>
                  <td>Number of times that <italic>x</italic><sup>A</sup> is assigned to topic <italic>k</italic></td>
                </tr>
                <tr valign="top">
                  <td>
                    <graphic xlink:href="medinform_v8i7e16312_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
                  </td>
                  <td>Number of times that any feature A is assigned to topic <italic>k</italic></td>
                </tr>
                <tr valign="top">
                  <td>
                    <graphic xlink:href="medinform_v8i7e16312_fig10.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
                  </td>
                  <td>Number of all features of prescription <italic>m</italic> (including both A and B) assigned to topic <italic>k</italic></td>
                </tr>
                <tr valign="top">
                  <td>
                    <graphic xlink:href="medinform_v8i7e16312_fig11.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
                  </td>
                  <td>All features in prescription <italic>m</italic></td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
        </sec>
        <sec>
          <title>Step 3: Inferring and Anomaly Scoring</title>
          <p>In this step, a separate dataset was used for inferring 15,000 randomly sampled prescriptions from the BRPRD (2016) that had already been manually reviewed by experienced pharmacists. Each feature in the MV-LDA model can be treated as an independent LDA model and can be inferred separately. To be specific, for the MV-LDA model obtained in the previous learning step, <italic>φ<sup>A</sup></italic> can be used to detect the new prescriptions in question, but this only pertains to estimations of the topic distribution under feature A. The equation for this is as follows:</p>
          <p>
            <graphic xlink:href="medinform_v8i7e16312_fig12.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>In this equation, <italic>φ<sub>x,k</sub><sup>A</sup></italic> is the value of the topic distribution under the circumstance of topic <italic>k</italic> and feature <italic>x</italic>. Finally, as in the topic generating step (step 2), we inferred the marginal <italic>θ</italic> based on the Gibbs sampling shown in equation 5, which indicated the proportion of feature A assigned to topic <italic>k</italic> for each prescription. Additionally, <inline-graphic xlink:href="medinform_v8i7e16312_fig15.png" xlink:type="simple" mimetype="image"/> is calculated under type B features. For each test prescription, both <inline-graphic xlink:href="medinform_v8i7e16312_fig14.png" xlink:type="simple" mimetype="image"/> and   <inline-graphic xlink:href="medinform_v8i7e16312_fig15.png" xlink:type="simple" mimetype="image"/> were inferred and used to calculate the anomaly score.</p>
          <p>
            <graphic xlink:href="medinform_v8i7e16312_fig13.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </p>
          <p>The assumption mentioned in step 2 is that the given order of diagnoses and prescribed medication should show consistency (ie, the values for <inline-graphic xlink:href="medinform_v8i7e16312_fig14.png" xlink:type="simple" mimetype="image"/> and <inline-graphic xlink:href="medinform_v8i7e16312_fig15.png" xlink:type="simple" mimetype="image"/> should be equal or close to each other), and if not, the prescription might be inappropriate. The similarity between <inline-graphic xlink:href="medinform_v8i7e16312_fig14.png" xlink:type="simple" mimetype="image"/> and <inline-graphic xlink:href="medinform_v8i7e16312_fig15.png" xlink:type="simple" mimetype="image"/> was measured using novel topic mapping (TM) methods [<xref ref-type="bibr" rid="ref46">46</xref>]. TM was performed in the following manner: we allocated topic feature distributions from the MV-LDA model for every diagnosis or medication before matching. First, high probability topics were tagged for each diagnosis. Thereafter, we similarly identified the most probable topics for each medication and added up the total. When a topic was not tagged, it was assigned an anomaly score of 1. Finally, the anomaly scores for each prescription were summed, and different thresholds were used to filter potentially inappropriate prescriptions.</p>
        </sec>
        <sec>
          <title>Step 4: Model Evaluation and Sensitivity Analysis</title>
          <p>The same prescriptions (15,000 randomly sampled prescriptions from the BRPRD in 2016) were inferred and detected by the MV-LDA model. <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> shows the confusion matrix of the screening test we used. The sensitivity, specificity, positive-predictive value (PPV), negative-predictive value (NPV), and Youden’s index were computed from the results to compare the assessments between the model and the experts and to identify the best performance parameter setting of TM. A sensitivity analysis was performed by randomly sampling 90%, 70%, 50%, 30%, and 10% of prescriptions from the evaluation data of the 15,000 prescriptions. The sensitivity, specificity, PPV, NPV, Youden’s index, and area under the receiver operating characteristic curve were compared. It should be noted that the overlap between training data and evaluation data was small enough to be ignored.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Prescriptions</title>
        <p>A total of 44,325,065 prescriptions from 22 million patients (138,535,092 records) at 349 hospitals, including 286 tertiary and 63 secondary hospitals, were used in our topic modeling process. This included 5,653 types of medications and 22,643 diseases or conditions. In the validation dataset, there were 14,166 (94.4%) outpatient prescriptions and 834 (5.6%) emergency prescriptions. Of these, 13,524 (90.2%) prescriptions satisfied the appropriate criteria (marked as “appropriate”) and 1476 (9.8%) failed (marked as “inappropriate”).</p>
      </sec>
      <sec>
        <title>Multiview Latent Dirichlet Allocation Topic Generation Results</title>
        <p>By setting the topic parameters, we obtained eight topic models, all with commonly diagnosed diseases in clinical practice. For example, the model (<italic>K</italic>=30) included cardiovascular diseases, diabetes, chronic nephrosis, osteoporosis, and some respiratory infections. Regarding topic 27, hypertension had a 93.3% probability of appearing in this topic, and amlodipine, nifedipine, levamlodipine, and metoprolol had probabilities of 11.7%, 8.9%, 7.7%, and 6.1%, respectively. The top probability diagnoses in topic 23 were bronchitis, pneumonia, and bronchopneumonia, with the proportions of 55.6%, 21.8%, and 12.1%, respectively, whereas the corresponding medications were ambroxol (11.2%), budesonide (10.7%), azithromycin (9.9%), and terbutaline (6.2%). We also obtained topics related to gastrointestinal diseases and mental and dermal disorders. The details pertaining to the top 10 topics and their allocations are shown in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
        <p>After comparing the training results of the topic models with settings at <italic>K</italic>=15, 20, 25, 30, 35, 40, 45, and 50 for the training results, it was found that a smaller topic number was associated with a weaker relation between the topics on one side and diagnoses and medications on the other, which were likely to appear more dispersed and had a lower probability of appearing in a topic. As the set value of the number of topics increased, the ability to summarize the disease was enhanced, that is, the subject-feature distribution of topic learning became more concentrated, the feature became more likely to appear in the topic, and the proportions of diagnosis and medication tended to be uniform.</p>
      </sec>
      <sec>
        <title>Multiview Latent Dirichlet Allocation Evaluation Sensitivity Analysis Results</title>
        <p>The BRPRD sample data evaluated the MV-LDA model. The performance of the MV-LDA model is shown in  <xref rid="figure3" ref-type="fig">Figure 3</xref>. Each model showed higher specificity and NPV for some topics, with the NPV reaching more than 90%, and the sensitivity being the highest at a TM threshold of 1. As the threshold value declined, the sensitivity decreased, the specificity and PPV increased, and the NPV showed no relevant change. When the number of topics increased, the sensitivity increased greatly, but the specificity, PPV, and NPV changed little.</p>
        <p>Taking all factors (sensitivity, specificity, PPV, NPV, and Youden’s index) into consideration, we set a cutoff of ≥1 TM anomaly scoring as the threshold for our MV-LDA detection model. The results showed a high sensitivity of 81.8% and a moderate specificity of 47.4%, and the PPV and NPV were 14.5% and 96.0%, respectively. These findings indicate that under the best performance parameter setting, we can find 1208 of 1476 inappropriate prescriptions.</p>
        <p>Our model evaluation results revealed that the MV-LDA model had a better ability to detect inappropriate prescriptions when the TM threshold was set to 1. However, for a better understanding of the robustness of the results at this parameter setting, we performed a sensitivity analysis, repeating the experiments with separate sampling proportions of 90%, 70%, 50%, 30%, and 10%. <xref ref-type="table" rid="table3">Table 3</xref> presents the findings. There were no relevant differences between the two experiments.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Summary of the performance of multiview latent Dirichlet allocation model with TM detection methods under different thresholds. Horizontal axis: thresholds of TM methods (from 1 to 5). Vertical axis: percentage of SEN, SPE, PPV, and NPV. K: number of topics; NPV: negative-predictive value; PPV: positive-predictive value; SEN: sensitivity; SPE: specificity; TM: topic mapping.</p>
          </caption>
          <graphic xlink:href="medinform_v8i7e16312_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Sensitivity analysis for multiview latent Dirichlet allocation with topic mapping detection methods (threshold=1).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="100"/>
            <col width="90"/>
            <col width="90"/>
            <col width="90"/>
            <col width="90"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <col width="90"/>
            <col width="130"/>
            <col width="80"/>
            <thead>
              <tr valign="top">
                <td>Sampling proportion</td>
                <td>TP<sup>a</sup>, n (%)</td>
                <td>FP<sup>b</sup>, n (%)</td>
                <td>FN<sup>c</sup>, n (%)</td>
                <td>TN<sup>d</sup>, n (%)</td>
                <td>SEN<sup>e</sup> (%)</td>
                <td>SPE<sup>f</sup> (%)</td>
                <td>PPV<sup>g</sup> (%)</td>
                <td>NPV<sup>h</sup> (%)</td>
                <td>Youden’s index</td>
                <td>AUROC<sup>i</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>90%</td>
                <td>1073 (7.9)</td>
                <td>5752 (42.6)</td>
                <td>249 (1.8)</td>
                <td>6435 (47.6)</td>
                <td>81.2</td>
                <td>47.2</td>
                <td>14.3</td>
                <td>95.9</td>
                <td>14.3</td>
                <td>0.689</td>
              </tr>
              <tr valign="top">
                <td>70%</td>
                <td>823 (7.9)</td>
                <td>4446 (42.7)</td>
                <td>179 (1.7)</td>
                <td>4954 (47.6)</td>
                <td>82.1</td>
                <td>47.3</td>
                <td>14.2</td>
                <td>96.1</td>
                <td>14.2</td>
                <td>0.695</td>
              </tr>
              <tr valign="top">
                <td>50%</td>
                <td>570 (7.6)</td>
                <td>3235 (43.1)</td>
                <td>143 (1.9)</td>
                <td>3562 (47.4)</td>
                <td>79.9</td>
                <td>47.6</td>
                <td>13.8</td>
                <td>95.8</td>
                <td>13.8</td>
                <td>0.686</td>
              </tr>
              <tr valign="top">
                <td>30%</td>
                <td>383 (8.6)</td>
                <td>1958 (43.9)</td>
                <td>93 (2.1)</td>
                <td>2030 (45.5)</td>
                <td>80.5</td>
                <td>49.1</td>
                <td>15.9</td>
                <td>95.5</td>
                <td>15.9</td>
                <td>0.705</td>
              </tr>
              <tr valign="top">
                <td>10%</td>
                <td>109 (7.3)</td>
                <td>622 (41.9)</td>
                <td>21 (1.4)</td>
                <td>734 (49.4)</td>
                <td>83.8</td>
                <td>45.9</td>
                <td>12.9</td>
                <td>96.7</td>
                <td>12.9</td>
                <td>0.693</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>TP: true positive.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>FP: false positive.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>FN: false negative.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>TN: true negative.</p>
            </fn>
            <fn id="table3fn5">
              <p><sup>e</sup>SEN: sensitivity.</p>
            </fn>
            <fn id="table3fn6">
              <p><sup>f</sup>SPE: specificity.</p>
            </fn>
            <fn id="table3fn7">
              <p><sup>g</sup>PPV: positive-predictive value.</p>
            </fn>
            <fn id="table3fn8">
              <p><sup>h</sup>NPV: negative-predictive value.</p>
            </fn>
            <fn id="table3fn9">
              <p><sup>i</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The study drew upon the data of almost 45 million prescriptions obtained from the CMNRUD database (between October and December 2016). It then used the MV-LDA combination of TM anomaly detection and LDA topic modeling to build a model for detecting the inappropriate use of prescription medication. The model had a sensitivity of 81.8% and a specificity of 47.4% with 45 topics, and it had an anomaly threshold of 1 and showed stability in the sensitivity analysis. The topics that were already built into our study included most disorders, and the topics that were generated included noncommunicable diseases, such as cardiovascular diseases, which appeared in the largest proportions, consistent with clinical practice. The model also accommodated the tendency for many disorders to be seen in winter. For instance, upper respiratory infections, fever, and acute bronchitis were determined to be highly probable in winter. It took only 3.5 hours to generate the topics and only seconds to detect an anomaly, much quicker than the system of manual review or knowledge-based prescription review.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>The present work has several limitations. The MV-LDA model has more features than were used in this study, including usage, dosage, cost, and even laboratory test results, when available. Moreover, it was challenging to clean accessional variables from the data source. For example, there are multiple modes of recording dose packaging because the composition and dosage forms of medicines differ from each other. Because of the difficulties noted above, the first limitation is that our method ignored the medication’s usage and dosage and only addressed the medication itself when building the MV-LDA model and validating the results. Second, the current model is still not supported for indicating the specific medication but tells us which prescriptions do not comply with the prescription review criteria. Besides, limited by the failure to obtain a labeled training dataset, the current model is not able to classify prescription misuse by criteria, such as the absence of proper indications, violation of clinical guidelines, and misuse of dosage, and can only detect the appropriateness of prescriptions. This study is also limited by the diverse structure of the model training and evaluation database and a minor overlap between the datasets used. However, we thought that a minor overlap of the data might not be associated with a major change in the results. Meanwhile, the two databases showed a commonality in their treatment patterns, and this, in fact, could be a topic for exploratory research on methodology. While this study focused on the development of a model, in the future, we will address a diverse range of parameters to determine the most effective MV-LDA model for detecting prescription misuse.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>Studies, such as those encouraging regular medication review and introducing automated information systems [<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref48">48</xref>], have been conducted with the aim of controlling the inappropriate use of medications in China. However, the increasing number of new drugs entering the market, delays in updating the databases, and insufficient knowledge of medications all raise the probability of nonideal use [<xref ref-type="bibr" rid="ref49">49</xref>]. Knowledge-based and experience-based software has relevant limitations, including efficiency constraints. However, data mining techniques are customizable and can identify inappropriate prescriptions. For example, association rule mining has been used to find inappropriate prescriptions by calculating the co-occurrence of medications and diseases, resulting in a sensitivity of 75.9% and a specificity of 89.5% [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]. These methods however do have disadvantages, including inefficiency in the generation of candidate item sets because they require vast data sources and the frequent scanning of databases.</p>
        <p>Furthermore, these methods often fail to explore latent structures and are prone to making spurious associations that can mislead clinical practitioners. Besides, in a previous study, a model combining natural language processing with guidelines based on expert knowledge was used to detect medication overuse, and it showed degrees of sensitivity and specificity that were similar to those in our study [<xref ref-type="bibr" rid="ref50">50</xref>]. Despite using different data sources and operating under diverse study conditions, we noted a higher sensitivity as compared with the association rule mining method. Although we failed to obtain a higher PPV, which is strongly related to the prevalence of inappropriate prescriptions, we think the MV-LDA model is suitable for preliminary screening and can be an alternative detection method, allowing clinical practice to flag potentially inappropriate prescriptions for manual review. Such a step could save a large amount of working time and reduce labor intensity.</p>
        <p>A topic model is a multiple machine learning method and is used to reveal the semantics in the body of the text. With its advantages of topic extraction and model expansibility, LDA has become a commonly used topic modeling method. It was first used to extract underlying semantics and was then optimized to become a robust means of text mining analysis for social media [<xref ref-type="bibr" rid="ref51">51</xref>-<xref ref-type="bibr" rid="ref53">53</xref>]. Recently, topic modeling methods, particularly LDA, have been used for both structured and unstructured clinical data [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref54">54</xref>-<xref ref-type="bibr" rid="ref56">56</xref>]. Several studies have attempted to scale the efficiency of LDA’s topic generation. The symptom-herb-diagnosis topic model, which was proposed to determine the association between treatment with Chinese medicine and diabetes, can be used to find herbs to treat specific symptoms [<xref ref-type="bibr" rid="ref55">55</xref>]. Multiple-channel LDA [<xref ref-type="bibr" rid="ref57">57</xref>] focused on the support system for clinical decisions and based itself on a similar concept that the coupling of diagnoses and medications reflects the health status of patients at the time of seeing a doctor. However, we were not able to obtain a piece of well-recorded contextual information or additional information, but we could leverage two variables (diagnosis and medication) and realize the aim of the study. Besides, given the shortcomings of miscellaneous algorithms and more extended calculations of an LDA-based model, various measures were taken to improve the MV-LDA algorithm in our project, which is not the focus of this study. The multiview topic modeling approach used here has been previously tested in different languages [<xref ref-type="bibr" rid="ref34">34</xref>]. This allowed us to take both medications and diagnoses into consideration simultaneously. We leveraged these advantages and processed only half of the data used in a previous study to determine the association between diagnoses and medications for each prescription [<xref ref-type="bibr" rid="ref58">58</xref>]. Prescriptions in our study were considered the equivalent of articles in that previous study, reflecting the particular situation of those patients. The topics and their allocations were consistent with clinical practice, providing proof of the robustness of our method.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Our MV-LDA model can train the distribution of diagnosis-medication topics from a large number of prescriptions and can detect the potentially inappropriate use of prescription medications when combined with the TM method. Considering its mediocre specificity and moderate sensitivity, this model can be used as a primary screening tool and will likely complement and improve manual review. The model still needs more extension of views (introduction of more variables) to make full use of the information in the prescription and further improve the ability to identify prescription misuse.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Confusion matrix of model evaluation (multiview latent Dirichlet allocation model versus experts).</p>
        <media xlink:href="medinform_v8i7e16312_app1.docx" xlink:title="DOCX File , 14 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Example results of multiview latent Dirichlet allocation topic modeling (K=30).</p>
        <media xlink:href="medinform_v8i7e16312_app2.docx" xlink:title="DOCX File , 25 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">BRPRD</term>
          <def>
            <p>Beijing Regional Prescription Review Database</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CMNRUD</term>
          <def>
            <p>Chinese Monitoring Network for the Rational Use of Drugs</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">LDA</term>
          <def>
            <p>latent Dirichlet allocation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">MV-LDA</term>
          <def>
            <p>multiview latent Dirichlet allocation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NPV</term>
          <def>
            <p>negative-predictive value</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">PPV</term>
          <def>
            <p>positive-predictive value</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">TM</term>
          <def>
            <p>topic mapping</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by the National Natural Foundation of China (grant number 91646107) and the Beijing Municipal Science and Technology Project (grant number D151100002215002).</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>LZ was the principal investigator for this study; she contributed to the design, analysis, and interpretation of the study. YY and YC contributed to the analysis and interpretation of data and provided clinical support. SL, ST, and JZ contributed to the model’s development. YH and JZ contributed to data extraction. LZ and YC drafted the manuscript. SZ provided overall supervision of the study and critically edited the manuscript. All authors reviewed the manuscript critically for scientific content, and all authors gave final approval of this version for publication.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <source>World Health Organization</source>
          <year>2004</year>
          <access-date>2019-11-14</access-date>
          <comment>World Medicines Situation<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/medicines/areas/policy/world_medicines_situation/en/">https://www.who.int/medicines/areas/policy/world_medicines_situation/en/</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Holloway</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dijk</surname>
              <given-names>LV</given-names>
            </name>
          </person-group>
          <source>World Health Organization</source>
          <year>2011</year>
          <access-date>2019-10-12</access-date>
          <comment>The World Medicines Situation 2011: Rational Use of Medicines<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/medicines/areas/policy/world_medicines_situation/WMS_ch14_wRational.pdf">https://www.who.int/medicines/areas/policy/world_medicines_situation/WMS_ch14_wRational.pdf</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hamilton</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Gallagher</surname>
              <given-names>PF</given-names>
            </name>
            <name name-style="western">
              <surname>O'Mahony</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Inappropriate prescribing and adverse drug events in older people</article-title>
          <source>BMC Geriatr</source>
          <year>2009</year>
          <month>01</month>
          <day>28</day>
          <volume>9</volume>
          <fpage>5</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/19175914"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2318-9-5</pub-id>
          <pub-id pub-id-type="medline">19175914</pub-id>
          <pub-id pub-id-type="pii">1471-2318-9-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC2642820</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lederberg</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Infectious history</article-title>
          <source>Science</source>
          <year>2000</year>
          <month>04</month>
          <day>14</day>
          <volume>288</volume>
          <issue>5464</issue>
          <fpage>287</fpage>
          <lpage>93</lpage>
          <pub-id pub-id-type="doi">10.1126/science.288.5464.287</pub-id>
          <pub-id pub-id-type="medline">10777411</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reynolds</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>McKee</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Factors influencing antibiotic prescribing in China: an exploratory analysis</article-title>
          <source>Health Policy</source>
          <year>2009</year>
          <month>04</month>
          <volume>90</volume>
          <issue>1</issue>
          <fpage>32</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1016/j.healthpol.2008.09.002</pub-id>
          <pub-id pub-id-type="medline">18849089</pub-id>
          <pub-id pub-id-type="pii">S0168-8510(08)00206-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Song</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Petzold</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The impact of China's national essential medicine system on improving rational drug use in primary health care facilities: an empirical study in four provinces</article-title>
          <source>BMC Health Serv Res</source>
          <year>2014</year>
          <month>10</month>
          <day>25</day>
          <volume>14</volume>
          <fpage>507</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmchealthservres.biomedcentral.com/articles/10.1186/s12913-014-0507-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12913-014-0507-3</pub-id>
          <pub-id pub-id-type="medline">25344413</pub-id>
          <pub-id pub-id-type="pii">s12913-014-0507-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC4213512</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Overprescribing in China, driven by financial incentives, results in very high use of antibiotics, injections, and corticosteroids</article-title>
          <source>Health Aff (Millwood)</source>
          <year>2012</year>
          <month>05</month>
          <volume>31</volume>
          <issue>5</issue>
          <fpage>1075</fpage>
          <lpage>82</lpage>
          <pub-id pub-id-type="doi">10.1377/hlthaff.2010.0965</pub-id>
          <pub-id pub-id-type="medline">22566449</pub-id>
          <pub-id pub-id-type="pii">31/5/1075</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
          <source>Ministry of Health of the People's Republic of China</source>
          <year>2010</year>
          <access-date>2018-02-06</access-date>
          <comment>Management Practices of Hospital Prescription Comment (trial)<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.gov.cn/gzdt/2010-03/04/content_1547080.htm">http://www.gov.cn/gzdt/2010-03/04/content_1547080.htm</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mei</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Influence of automated pharmacy system on waiting time in outpatient pharmacy</article-title>
          <source>Chinese Journal of Hospital Pharmacy (1)</source>
          <year>2014</year>
          <fpage>63</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.13286/j.cnki.chinhosppharmacyj.2014.01.19</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="web">
          <source>Peking University Third Hospital</source>
          <year>2018</year>
          <access-date>2018-11-04</access-date>
          <comment>Outpatient pharmacy<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.puh3.net.cn/yjk/ksbm/153254.shtml">https://www.puh3.net.cn/yjk/ksbm/153254.shtml</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gong</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Research of real-time review system of electronic prescriptions for putpatient and emergency in hospital</article-title>
          <source>Science Mosaic</source>
          <year>2016</year>
          <issue>5</issue>
          <fpage>33</fpage>
          <lpage>5</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Discussions on Problems about the Monitoring System for Rational Drug Use and Relevant Countermeasures</article-title>
          <source>China Pharmacy</source>
          <year>2015</year>
          <issue>22</issue>
          <fpage>3159</fpage>
          <lpage>61</lpage>
          <pub-id pub-id-type="doi">10.6039/j.issn.1001-0408.2015.22.42</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ostrzinski</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fredrich</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Havemann</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Krafczyk</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffmann</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Efficient data management in a large-scale epidemiology research project</article-title>
          <source>Comput Methods Programs Biomed</source>
          <year>2012</year>
          <month>09</month>
          <volume>107</volume>
          <issue>3</issue>
          <fpage>425</fpage>
          <lpage>35</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cmpb.2010.12.016</pub-id>
          <pub-id pub-id-type="medline">21256617</pub-id>
          <pub-id pub-id-type="pii">S0169-2607(10)00319-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peikari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Salama</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nofech-Mozes</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Martel</surname>
              <given-names>AL</given-names>
            </name>
          </person-group>
          <article-title>A Cluster-then-label Semi-supervised Learning Approach for Pathology Image Classification</article-title>
          <source>Sci Rep</source>
          <year>2018</year>
          <month>05</month>
          <day>08</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>7193</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.doi.org/10.1038/s41598-018-24876-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-018-24876-0</pub-id>
          <pub-id pub-id-type="medline">29739993</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-018-24876-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC5940864</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gallagher</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Loveday</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Connor</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wiles</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Detecting anomalies in controlled drug prescription data using probabilistic models</article-title>
          <year>2015</year>
          <conf-name>Australasian Conference on Artificial Life and Computational Intelligence</conf-name>
          <conf-date>February 5-7, 2015</conf-date>
          <conf-loc>Newcastle, NSW, Australia</conf-loc>
          <publisher-name>Springer, Cham</publisher-name>
          <fpage>337</fpage>
          <lpage>349</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-319-14803-8_26</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nirad</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Surendro</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Outlier detection using association rule mining for information quality improvement</article-title>
          <year>2017</year>
          <conf-name>International Conference on Recent Trends in Science, Engineering and Technology</conf-name>
          <conf-date>July 10-11, 2017</conf-date>
          <conf-loc>Bangkok, Thailand</conf-loc>
          <pub-id pub-id-type="doi">10.17758/eap.dir0717002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Valko</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kveton</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Valizadegan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hauskrecht</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Conditional anomaly detection with soft harmonic functions</article-title>
          <year>2011</year>
          <conf-name>11th International Conference on Data Mining</conf-name>
          <conf-date>December 11-14, 2011</conf-date>
          <conf-loc>Vancouver, BC, Canada</conf-loc>
          <publisher-name>IEEE</publisher-name>
          <fpage>735</fpage>
          <lpage>743</lpage>
          <pub-id pub-id-type="doi">10.1109/icdm.2011.40</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Song</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jermaine</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ranka</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Conditional Anomaly Detection</article-title>
          <source>IEEE Trans Knowl Data Eng</source>
          <year>2007</year>
          <month>5</month>
          <volume>19</volume>
          <issue>5</issue>
          <fpage>631</fpage>
          <lpage>645</lpage>
          <pub-id pub-id-type="doi">10.1109/tkde.2007.1009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Brunak</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Mining electronic health records: towards better research applications and clinical care</article-title>
          <source>Nat Rev Genet</source>
          <year>2012</year>
          <month>05</month>
          <day>02</day>
          <volume>13</volume>
          <issue>6</issue>
          <fpage>395</fpage>
          <lpage>405</lpage>
          <pub-id pub-id-type="doi">10.1038/nrg3208</pub-id>
          <pub-id pub-id-type="medline">22549152</pub-id>
          <pub-id pub-id-type="pii">nrg3208</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>MI</given-names>
            </name>
          </person-group>
          <article-title>Latent Dirichlet allocation</article-title>
          <source>J Mach Learn Res</source>
          <year>2003</year>
          <volume>3</volume>
          <issue>4-5</issue>
          <fpage>993</fpage>
          <lpage>1022</lpage>
          <pub-id pub-id-type="doi">10.1056/NEJM196803212781204</pub-id>
          <pub-id pub-id-type="medline">5637250</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cha</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Moon</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Identifying prescription patterns with a topic model of diseases and medications</article-title>
          <source>J Biomed Inform</source>
          <year>2017</year>
          <volume>75</volume>
          <fpage>35</fpage>
          <lpage>47</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(17)30200-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2017.09.003</pub-id>
          <pub-id pub-id-type="medline">28958484</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(17)30200-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>QT</given-names>
            </name>
            <name name-style="western">
              <surname>Redd</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Rindflesch</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Nebeker</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Synonym, topic model and predicate-based query expansion for retrieving clinical documents</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2012</year>
          <volume>2012</volume>
          <fpage>1050</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23304381"/>
          </comment>
          <pub-id pub-id-type="medline">23304381</pub-id>
          <pub-id pub-id-type="pmcid">PMC3540443</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shivashankar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Srivathsan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ravindran</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tendulkar</surname>
              <given-names>AV</given-names>
            </name>
          </person-group>
          <article-title>Multi-view methods for protein structure comparison using latent dirichlet allocation</article-title>
          <source>Bioinformatics</source>
          <year>2011</year>
          <month>07</month>
          <day>01</day>
          <volume>27</volume>
          <issue>13</issue>
          <fpage>i61</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21685102"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btr249</pub-id>
          <pub-id pub-id-type="medline">21685102</pub-id>
          <pub-id pub-id-type="pii">btr249</pub-id>
          <pub-id pub-id-type="pmcid">PMC3117356</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Duan</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Discovery of clinical pathway patterns from event logs using probabilistic topic models</article-title>
          <source>J Biomed Inform</source>
          <year>2014</year>
          <month>02</month>
          <volume>47</volume>
          <fpage>39</fpage>
          <lpage>57</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(13)00144-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2013.09.003</pub-id>
          <pub-id pub-id-type="medline">24076435</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(13)00144-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Duan</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Incorporating comorbidities into latent treatment pattern mining for clinical pathways</article-title>
          <source>J Biomed Inform</source>
          <year>2016</year>
          <month>02</month>
          <volume>59</volume>
          <fpage>227</fpage>
          <lpage>39</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(15)00292-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2015.12.012</pub-id>
          <pub-id pub-id-type="medline">26719169</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(15)00292-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Mining Patterns of Disease Progression: A Topic-Model-Based Approach</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2016</year>
          <volume>228</volume>
          <fpage>354</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="medline">27577403</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chong</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>FF</given-names>
            </name>
          </person-group>
          <article-title>Simultaneous image classification and annotation</article-title>
          <year>2009</year>
          <conf-name>IEEE Conference on Computer Vision and Pattern Recognition</conf-name>
          <conf-date>June 20-25, 2009</conf-date>
          <conf-loc>Miami, FL, USA</conf-loc>
          <fpage>1903</fpage>
          <lpage>1910</lpage>
          <pub-id pub-id-type="doi">10.1109/cvpr.2009.5206800</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Grimson</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Unsupervised activity perception by hierarchical bayesian models</article-title>
          <source>IEEE Trans Pattern Anal Mach Intell</source>
          <year>2009</year>
          <volume>31</volume>
          <issue>3</issue>
          <fpage>539</fpage>
          <lpage>55</lpage>
          <pub-id pub-id-type="doi">10.1109/cvpr.2007.383072</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Poldrack</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Mumford</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Schonberg</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kalar</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Barman</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Yarkoni</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Discovering relations between mind, brain, and mental disorders using topic mapping</article-title>
          <source>PLoS Comput Biol</source>
          <year>2012</year>
          <volume>8</volume>
          <issue>10</issue>
          <fpage>e1002707</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1002707"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pcbi.1002707</pub-id>
          <pub-id pub-id-type="medline">23071428</pub-id>
          <pub-id pub-id-type="pii">PCOMPBIOL-D-12-00776</pub-id>
          <pub-id pub-id-type="pmcid">PMC3469446</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Duan</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>A probabilistic topic model for clinical risk stratification from electronic health records</article-title>
          <source>J Biomed Inform</source>
          <year>2015</year>
          <month>12</month>
          <volume>58</volume>
          <fpage>28</fpage>
          <lpage>36</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(15)00197-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2015.09.005</pub-id>
          <pub-id pub-id-type="medline">26370451</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(15)00197-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tsykin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Goodall</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Green</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Identifying functional miRNA-mRNA regulatory modules with correspondence latent dirichlet allocation</article-title>
          <source>Bioinformatics</source>
          <year>2010</year>
          <month>12</month>
          <day>15</day>
          <volume>26</volume>
          <issue>24</issue>
          <fpage>3105</fpage>
          <lpage>11</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/20956247"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btq576</pub-id>
          <pub-id pub-id-type="medline">20956247</pub-id>
          <pub-id pub-id-type="pii">btq576</pub-id>
          <pub-id pub-id-type="pmcid">PMC2995118</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pivovarov</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Perotte</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Grave</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Angiolillo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wiggins</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Learning probabilistic phenotypes from heterogeneous EHR data</article-title>
          <source>J Biomed Inform</source>
          <year>2015</year>
          <month>12</month>
          <volume>58</volume>
          <fpage>156</fpage>
          <lpage>165</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(15)00223-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2015.10.001</pub-id>
          <pub-id pub-id-type="medline">26464024</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(15)00223-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>An overview of topic modeling and its current applications in bioinformatics</article-title>
          <source>Springerplus</source>
          <year>2016</year>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>1608</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27652181"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s40064-016-3252-8</pub-id>
          <pub-id pub-id-type="medline">27652181</pub-id>
          <pub-id pub-id-type="pii">3252</pub-id>
          <pub-id pub-id-type="pmcid">PMC5028368</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Iwata</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kashima</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Robust multi-view topic modeling by incorporating detecting anomalies</article-title>
          <year>2017</year>
          <conf-name>Joint European Conference on Machine Learning and Knowledge Discovery in Databases</conf-name>
          <conf-date>September 18-22, 2017</conf-date>
          <conf-loc>Skopje, Macedonia</conf-loc>
          <fpage>238</fpage>
          <lpage>250</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-319-71246-8_15</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A survey of multi-view machine learning</article-title>
          <source>Neural Comput &#38; Applic</source>
          <year>2013</year>
          <month>2</month>
          <day>17</day>
          <volume>23</volume>
          <issue>7-8</issue>
          <fpage>2031</fpage>
          <lpage>2038</lpage>
          <pub-id pub-id-type="doi">10.1007/s00521-013-1362-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>A survey on multi-view learning</article-title>
          <source>arXiv preprint</source>
          <year>2013</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1304.5634.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Mei</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Probabilistic-mismatch anomaly detection: do one’s medications match with the diagnoses</article-title>
          <year>2016</year>
          <conf-name>IEEE 16th International Conference on Data Mining (ICDM)</conf-name>
          <conf-date>December 12-15, 2016</conf-date>
          <conf-loc>Barcelona, Spain</conf-loc>
          <fpage>659</fpage>
          <lpage>668</lpage>
          <pub-id pub-id-type="doi">10.1109/icdm.2016.0077</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Establishment and application of Chineses monitoring network for the rational use of drugs system</article-title>
          <source>Exploration of Rational Drug Use in China</source>
          <year>2009</year>
          <volume>6</volume>
          <issue>8</issue>
          <fpage>5</fpage>
          <lpage>8</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhan</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of Electronic Healthcare Databases for Post-Marketing Drug Safety Surveillance and Pharmacoepidemiology in China</article-title>
          <source>Drug Saf</source>
          <year>2018</year>
          <month>01</month>
          <volume>41</volume>
          <issue>1</issue>
          <fpage>125</fpage>
          <lpage>137</lpage>
          <pub-id pub-id-type="doi">10.1007/s40264-017-0589-z</pub-id>
          <pub-id pub-id-type="medline">28815480</pub-id>
          <pub-id pub-id-type="pii">10.1007/s40264-017-0589-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kong</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Effect evaluation of regional prescription review on rational clinical drug use</article-title>
          <source>Chinese Journal of Hospital Administration</source>
          <year>2015</year>
          <issue>7</issue>
          <fpage>531</fpage>
          <lpage>3</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="web">
          <source>Ministry of Health of the People's Republic of China</source>
          <access-date>2019-11-08</access-date>
          <comment>Prescription Administrative Policy 2007<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.gov.cn/flfg/2007-03/13/content_549406.htm">http://www.gov.cn/flfg/2007-03/13/content_549406.htm</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Syed-Abdul</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Iqbal</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Clinciu</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Jian</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>A probabilistic model for reducing medication errors</article-title>
          <source>PLoS One</source>
          <year>2013</year>
          <volume>8</volume>
          <issue>12</issue>
          <fpage>e82401</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0082401"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0082401</pub-id>
          <pub-id pub-id-type="medline">24312659</pub-id>
          <pub-id pub-id-type="pii">PONE-D-13-25201</pub-id>
          <pub-id pub-id-type="pmcid">PMC3849453</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Iqbal</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jian</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>An automated technique to identify potential inappropriate traditional Chinese medicine (TCM) prescriptions</article-title>
          <source>Pharmacoepidemiol Drug Saf</source>
          <year>2016</year>
          <month>04</month>
          <volume>25</volume>
          <issue>4</issue>
          <fpage>422</fpage>
          <lpage>30</lpage>
          <pub-id pub-id-type="doi">10.1002/pds.3976</pub-id>
          <pub-id pub-id-type="medline">26910512</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Prescription review and inappropriate prescription analysis in our hospital in 2013</article-title>
          <source>Chinese Medical Science</source>
          <year>2014</year>
          <issue>16</issue>
          <fpage>129</fpage>
          <lpage>31</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Thermeau</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chute</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Discovering associations among diagnosis groups using topic modeling</article-title>
          <source>AMIA Jt Summits Transl Sci Proc</source>
          <year>2014</year>
          <volume>2014</volume>
          <fpage>43</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25954576"/>
          </comment>
          <pub-id pub-id-type="medline">25954576</pub-id>
          <pub-id pub-id-type="pmcid">PMC4419765</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhuo</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>An extended topic model based abnormal medical prescription detection method</article-title>
          <year>2018</year>
          <conf-name>National Conference on Pervasive Computing</conf-name>
          <conf-date>September 14-16, 2018</conf-date>
          <conf-loc>Tianjin, China</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="web">
          <source>World Health Organization</source>
          <year>2016</year>
          <access-date>2020-04-24</access-date>
          <comment>Medication Errors: Technical Series on Safer Primary Care<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://apps.who.int/iris/bitstream/handle/10665/252274/9789241511643-eng.pdf?sequence=1">https://apps.who.int/iris/bitstream/handle/10665/252274/9789241511643-eng.pdf?sequence=1</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Velo</surname>
              <given-names>GP</given-names>
            </name>
            <name name-style="western">
              <surname>Minuz</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Medication errors: prescribing faults and prescription errors</article-title>
          <source>Br J Clin Pharmacol</source>
          <year>2009</year>
          <month>06</month>
          <volume>67</volume>
          <issue>6</issue>
          <fpage>624</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1111/j.1365-2125.2009.03425.x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1365-2125.2009.03425.x</pub-id>
          <pub-id pub-id-type="medline">19594530</pub-id>
          <pub-id pub-id-type="pii">BCP3425</pub-id>
          <pub-id pub-id-type="pmcid">PMC2723200</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Reasons of irrational drug use in medical institutions and its countermeasures: a case study of irrational drug use in department of gastroenterology</article-title>
          <source>Medicine and Philosophy</source>
          <year>2015</year>
          <volume>36</volume>
          <issue>15</issue>
          <fpage>51</fpage>
          <lpage>53</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Salmasian</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Freedberg</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Abrams</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>An automated tool for detecting medication overuse based on the electronic health records</article-title>
          <source>Pharmacoepidemiol Drug Saf</source>
          <year>2013</year>
          <month>02</month>
          <volume>22</volume>
          <issue>2</issue>
          <fpage>183</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23233423"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/pds.3387</pub-id>
          <pub-id pub-id-type="medline">23233423</pub-id>
          <pub-id pub-id-type="pmcid">PMC3566345</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Comparing twitter and traditional media using topic models</article-title>
          <year>2011</year>
          <conf-name>European Conference on Information Retrieval</conf-name>
          <conf-date>April 18-21, 2011</conf-date>
          <conf-loc>Dublin, Ireland</conf-loc>
          <fpage>338</fpage>
          <lpage>349</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-642-20161-5_34</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xianghua</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Yanyan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zhiqiang</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Multi-aspect sentiment analysis for Chinese online social reviews based on topic modeling and HowNet lexicon</article-title>
          <source>Knowledge-Based Systems</source>
          <year>2013</year>
          <month>1</month>
          <volume>37</volume>
          <issue>2</issue>
          <fpage>186</fpage>
          <lpage>195</lpage>
          <pub-id pub-id-type="doi">10.1016/j.knosys.2012.08.003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Multi-aspect blog sentiment analysis based on LDA topic model and Hownet Lexicon</article-title>
          <year>2011</year>
          <conf-name>International Conference on Web Information Systems and Mining</conf-name>
          <conf-date>September 24-25, 2011</conf-date>
          <conf-loc>Taiyuan, China</conf-loc>
          <fpage>131</fpage>
          <lpage>138</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-642-23982-3_17</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Xiahou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>TCM clinic records data mining approaches based on weighted-LDA and multi-relationship LDA model</article-title>
          <source>Multimed Tools Appl</source>
          <year>2016</year>
          <month>4</month>
          <day>13</day>
          <volume>75</volume>
          <issue>22</issue>
          <fpage>14203</fpage>
          <lpage>14232</lpage>
          <pub-id pub-id-type="doi">10.1007/s11042-016-3363-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Topic model for Chinese medicine diagnosis and prescription regularities analysis: case on diabetes</article-title>
          <source>Chin J Integr Med</source>
          <year>2011</year>
          <month>04</month>
          <volume>17</volume>
          <issue>4</issue>
          <fpage>307</fpage>
          <lpage>13</lpage>
          <pub-id pub-id-type="doi">10.1007/s11655-011-0699-x</pub-id>
          <pub-id pub-id-type="medline">21509676</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Aviram</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Redundancy-aware topic modeling for patient record notes</article-title>
          <source>PLoS One</source>
          <year>2014</year>
          <volume>9</volume>
          <issue>2</issue>
          <fpage>e87555</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0087555"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0087555</pub-id>
          <pub-id pub-id-type="medline">24551060</pub-id>
          <pub-id pub-id-type="pii">PONE-D-13-38704</pub-id>
          <pub-id pub-id-type="pmcid">PMC3923754</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hsiao</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Modeling healthcare data using multiple-channel latent Dirichlet allocation</article-title>
          <source>J Biomed Inform</source>
          <year>2016</year>
          <month>04</month>
          <volume>60</volume>
          <fpage>210</fpage>
          <lpage>23</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.jbi.2016.02.003"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2016.02.003</pub-id>
          <pub-id pub-id-type="medline">26898516</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(16)00025-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Multi-modal image annotation with multi-instance multi-label LDA</article-title>
          <year>2013</year>
          <conf-name>23rd International Joint Conference on Artificial Intelligence</conf-name>
          <conf-date>August 3-9, 2013</conf-date>
          <conf-loc>Beijing‚ China</conf-loc>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
