<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
    <front>
        <journal-meta>
            <journal-id journal-id-type="publisher-id">JMI</journal-id>
            <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
            <journal-title>JMIR Medical Informatics</journal-title>
            <issn pub-type="epub">2291-9694</issn>
            <publisher>
                <publisher-name>Gunther Eysenbach</publisher-name>
                <publisher-loc>JMIR Publications Inc., Toronto, Canada</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="publisher-id">v3i3e28</article-id>
            <article-id pub-id-type="pmid">26323593</article-id>
            <article-id pub-id-type="doi">10.2196/medinform.3982</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Original Paper</subject>
                </subj-group>
                <subj-group subj-group-type="article-type">
                    <subject>Original Paper</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Using MEDLINE Elemental Similarity to Assist in the Article Screening Process for Systematic Reviews</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="editor">
                    <name>
                        <surname>Eysenbach</surname>
                        <given-names>Gunther</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Tsafnat</surname>
                        <given-names>Guy</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Dunn</surname>
                        <given-names>Adam</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="author" id="contrib1">
                    <name name-style="western">
                        <surname>Ji</surname>
                        <given-names>Xiaonan</given-names>
                    </name>
                    <degrees>MS</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-5337-5031</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib2" corresp="yes">
                    <name name-style="western">
                        <surname>Yen</surname>
                        <given-names>Po-Yin</given-names>
                    </name>
                    <degrees>RN, PhD</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <address>
                        <institution>The Ohio State University</institution>
                        <institution>Department of Biomedical Informatics</institution>
                        <addr-line>1800 Canon Drive</addr-line>
                        <addr-line>Columbus, OH, </addr-line>
                        <country>United States</country>
                        <phone>1 503 889 6181</phone>
                        <email>po-yin.yen@osumc.edu</email>
                    </address>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-7061-4185</ext-link>
                </contrib>
            </contrib-group>
            <aff id="aff1">
                <sup>1</sup>
                <institution>The Ohio State University</institution>
                <institution>Department of Biomedical Informatics</institution>
                <addr-line>Columbus, OH</addr-line>
                <country>United States</country>
            </aff>
            <author-notes>
                <corresp>Corresponding Author: Po-Yin Yen <email>po-yin.yen@osumc.edu</email>
                </corresp>
            </author-notes>
            <pub-date pub-type="collection">
                <season>Jul-Sep</season>
                <year>2015</year>
            </pub-date>
            <pub-date pub-type="epub">
                <day>31</day>
                <month>08</month>
                <year>2015</year>
            </pub-date>
            <volume>3</volume>
            <issue>3</issue>
            <elocation-id>e28</elocation-id>
            <!--history from ojs - api-xml-->
            <history>
                <date date-type="received">
                    <day>27</day>
                    <month>10</month>
                    <year>2014</year>
                </date>
                <date date-type="rev-request">
                    <day>25</day>
                    <month>2</month>
                    <year>2015</year>
                </date>
                <date date-type="rev-recd">
                    <day>22</day>
                    <month>4</month>
                    <year>2015</year>
                </date>
                <date date-type="accepted">
                    <day>24</day>
                    <month>5</month>
                    <year>2015</year>
                </date>
            </history>
            <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
            <copyright-statement>&#169;Xiaonan Ji, Po-Yin Yen. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 31.08.2015. </copyright-statement>
            <copyright-year>2015</copyright-year>
            <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
                <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
            </license>
            <self-uri xlink:href="http://medinform.jmir.org/2015/3/e28/" xlink:type="simple" />
            <abstract>
                <sec sec-type="Background">
                    <title>Background</title>
                    <p>Systematic reviews and their implementation in practice provide high quality evidence for clinical practice but are both time and labor intensive due to the large number of articles. Automatic text classification has proven to be instrumental in identifying relevant articles for systematic reviews. Existing approaches use machine learning model training to generate classification algorithms for the article screening process but have limitations.</p>
                </sec>
                <sec sec-type="Objective">
                    <title>Objective</title>
                    <p>We applied a network approach to assist in the article screening process for systematic reviews using predetermined article relationships (similarity). The article similarity metric is calculated using the MEDLINE elements title (TI), abstract (AB), medical subject heading (MH), author (AU), and publication type (PT). We used an article network to illustrate the concept of article relationships. Using the concept, each article can be modeled as a node in the network and the relationship between 2 articles is modeled as an edge connecting them. The purpose of our study was to use the article relationship to facilitate an interactive article recommendation process.</p>
                </sec>
                <sec sec-type="Methods">
                    <title>Methods</title>
                    <p>We used 15 completed systematic reviews produced by the Drug Effectiveness Review Project and demonstrated the use of article networks to assist article recommendation. We evaluated the predictive performance of MEDLINE elements and compared our approach with existing machine learning model training approaches. The performance was measured by work saved over sampling at 95% recall (WSS95) and the F-measure (F<sub>1</sub>). We also used repeated analysis over variance and Hommel&#8217;s multiple comparison adjustment to demonstrate statistical evidence.</p>
                </sec>
                <sec sec-type="Results">
                    <title>Results</title>
                    <p>We found that although there is no significant difference across elements (except AU), TI and AB have better predictive capability in general. Collaborative elements bring performance improvement in both F<sub>1</sub> and WSS95. With our approach, a simple combination of TI+AB+PT could achieve a WSS95 performance of 37%, which is competitive to traditional machine learning model training approaches (23%-41% WSS95).</p>
                </sec>
                <sec sec-type="Conclusions">
                    <title>Conclusions</title>
                    <p>We demonstrated a new approach to assist in labor intensive systematic reviews. Predictive ability of different elements (both single and composited) was explored. Without using model training approaches, we established a generalizable method that can achieve a competitive performance.</p>
                </sec>
            </abstract>
            <kwd-group>
                <kwd>systematic review</kwd>
                <kwd>evidence-based medicine</kwd>
                <kwd>automatic document classification</kwd>
                <kwd>relevance feedback</kwd>
            </kwd-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="introduction">
            <title>Introduction</title>
            <p>Systematic reviews provide summaries of evidence from high quality studies to answer specific research questions. They are regularly used in health care [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref4">4</xref>] and for health policy making [<xref ref-type="bibr" rid="ref5">5</xref>]. Evidence-based medicine (EBM) relies heavily on the use of synthesized, up-to-date research evidence to make decisions. Systematic reviews are considered the highest quality source of evidence for EBM [<xref ref-type="bibr" rid="ref6">6</xref>]. However, systematic reviews require a series of very resource and time intensive steps [<xref ref-type="bibr" rid="ref4">4</xref>] that typically require several months to complete [<xref ref-type="bibr" rid="ref7">7</xref>]. Such workload and resource challenges can limit the tractability of an individual review, the ability to fund a review, and also the ability to respond to new evidence that may require an update to an existing review.</p>
            <p>MEDLINE is a biomedical literature database that stores and indexes a variety of relevant publications and is a primary resource for identifying studies for systematic reviews targeting the health sciences. However, the size of MEDLINE increases at a rate of over 12,000 articles per week, including reports related to over 300 randomized trials [<xref ref-type="bibr" rid="ref8">8</xref>]. The Cochrane Collaboration is an international organization dedicated to producing up-to-date systematic reviews, with more than 15,000 people participating in the work [<xref ref-type="bibr" rid="ref9">9</xref>]. According to The Cochrane Collaboration, more than 10,000 systematic reviews are needed for existing effectiveness research [<xref ref-type="bibr" rid="ref9">9</xref>]. In addition, a recent study reported that 23% of reviews require updates within 2 years [<xref ref-type="bibr" rid="ref10">10</xref>]. With the need to conduct a large amount of original and updated systematic reviews, it is essential to improve the efficiency of producing systematic reviews and their incumbent synthesized knowledge.</p>
            <p>A systematic review is commonly conducted by domain experts who are able to draft systematic review scopes, retrieve relevant citations, assess study quality, and synthesize evidence. The process can be broken down into 15 steps [<xref ref-type="bibr" rid="ref11">11</xref>]. Expert reviewers first identify the systematic review scope and research questions, and then generate search strategies to explore related databases (eg, MEDLINE). The search result is a list of citations usually organized in reference management software (eg, EndNote, RefWorks). Before synthesizing relevant evidence, expert reviewers need to classify articles based on the title and abstract. Then through the article screening (or article selection) process, relevant articles will proceed to the full-text level. In most systematic reviews, expert reviewers include a small portion ranging from 2% to 30% of citations at the title and abstract level; 1.6% to 27% get included at the full-text level [<xref ref-type="bibr" rid="ref7">7</xref>]. In other words, expert reviewers spend most of their effort excluding non-relevant or low quality studies. To accelerate this process, several machine learning approaches (ie, naive Bayes and support vector machine) [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref15">15</xref>] were proposed to focus on facilitating and enhancing the title and abstract level triage, abstracts screening [<xref ref-type="bibr" rid="ref11">11</xref>], or article screening, which is crucial and time-consuming as it requires expert reviewers to screen a large amount of literature. The intelligent article selection process can be also called citation classification or citation screening.</p>
            <p>In this paper, we proposed to use established and predetermined article relationships and incorporate the concept of active machine learning to iteratively recommend articles and receive feedback from human reviewers. Although the idea of integrating human judgment sounds similar to the active learning approach implemented in Wallace&#8217;s work [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>], our approach uses a different strategy. We do not formulate a classification model. Instead, we generate an article network representing the relationships between articles. We use the articles classified by human reviewers as a reference set to recommend the next similar article. There is no model trained during the recommendation procedure. The approach is similar to relevance feedback, a feature in some information retrieval systems. In general, users classify documents as relevant or irrelevant and provide the feedback to the information retrieval system. The information retrieval system then uses this information to retrieve documents similar to the relevant documents. Relevance feedback is commonly used as an automatic technique for queries modification. The process of relevance feedback is executed as a cycle of activity that refines queries in each iteration of feedback collection [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>].</p>
            <p>The predetermined relationships between articles can be conceptualized as an article network, which is different from the traditional citation network. A traditional citation network uses the <italic>citing</italic> and <italic>cited by</italic> of an article to build the network [<xref ref-type="bibr" rid="ref18">18</xref>]. We build article networks based on the similarity of any paired articles. Our similarity metric is calculated using data elements [<xref ref-type="bibr" rid="ref19">19</xref>] from an article, such as title, abstract, medical subject heading, author, and publication type. Under this concept, each article is modeled as a node in the network and the relationship (similarity) between two articles is modeled as an edge connecting them. Although the network method is not novel in the general document clustering area, we are the first to use the approach to facilitate systematic reviews and demonstrate its strength. <xref ref-type="fig" rid="figure1">Figure 1</xref> shows an illustrated network of a real systematic review (Urinary Incontinence) displayed in an aesthetically pleasing force-directed graphic layout. Theoretically, the network should be a complete graph in which every pair of articles has an edge representing the similarity between them. For visualization purposes, we eliminated the edges with lower similarity scores to provide a more human readable network.</p>
            <p>During our preliminary experiments, we found that a similarity score composed of all MEDLINE elements does not work well for every systematic review. We suspected that some elements (eg, title, abstract, publication type, MeSH, author) are better predictors for recommendations than others. Therefore, the purpose of our study was to answer two research questions. When an article is classified as included, what element(s) are better to use to calculate the similarity score to predict the next relevant article? Since every element plays a different role and should be weighted accordingly, what combinations and weights of elements are better to predict the next relevant article?</p>
            <fig id="figure1" position="float">
                <label>Figure 1</label>
                <caption>
                    <p>Illustrated article network.</p>
                </caption>
                <graphic xlink:href="medinform_v3i3e28_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
            </fig>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <sec>
                <title>Data Source</title>
                <p>To evaluate our approach, we used 15 publicly available completed systematic review samples produced by the Drug Effectiveness Review Project (DERP) (coordinated by the Center for Evidence-Based Policy at Oregon Health and Science University) [<xref ref-type="bibr" rid="ref20">20</xref>]. These 15 systematic reviews were completed by experienced and knowledgeable human expert reviewers, with inclusion and exclusion decisions made by at least two expert reviewers. <xref ref-type="table" rid="table1">Table 1</xref> shows the number and percentage of articles included at abstract level decision and full-text level decision.</p>
                <p>For instance, the review for ACE Inhibitors has a total of 2544 citations. Based on the abstracts, 183 (7.19%) were included; after full-text reading, 41 (1.61%) were included in the ACE Inhibitor systematic review. The final inclusion rates range from 0.78% to 27.04%. The 15 systematic reviews are also the same test collection previously used and made publicly available by Cohen et al [<xref ref-type="bibr" rid="ref7">7</xref>]. Using the PubMed Identifier (PMID), we downloaded the full record in MEDLINE format [<xref ref-type="bibr" rid="ref19">19</xref>] and extracted the data elements title, abstract, publication types, author and medical subject heading (MeSH) as the input.</p>
                <table-wrap position="float" id="table1">
                    <label>Table 1</label>
                    <caption>
                        <p>Total article numbers and rates of inclusion.</p>
                    </caption>
                    <table width="476" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="210" />
                        <col width="35" />
                        <col width="90" />
                        <col width="86" />
                        <thead>
                            <tr valign="top">
                                <td>SR report topic</td>
                                <td>Total</td>
                                <td>Abstract<break />n (%)</td>
                                <td>Full text<break />n (%)</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>ACE inhibitors</td>
                                <td>2544</td>
                                <td>183 (7.19)</td>
                                <td>41(1.61)</td>
                            </tr>
                            <tr valign="top">
                                <td>ADHD</td>
                                <td>851</td>
                                <td>84 (9.87)</td>
                                <td>20 (2.35)</td>
                            </tr>
                            <tr valign="top">
                                <td>Antihistamines</td>
                                <td>310</td>
                                <td>92 (29.68)</td>
                                <td>16 (5.16)</td>
                            </tr>
                            <tr valign="top">
                                <td>Atypical antipsychotics</td>
                                <td>1120</td>
                                <td>363 (32.41)</td>
                                <td>146 (13.04)</td>
                            </tr>
                            <tr valign="top">
                                <td>Beta blockers</td>
                                <td>2072</td>
                                <td>302 (14.58)</td>
                                <td>42 (2.03)</td>
                            </tr>
                            <tr valign="top">
                                <td>Calcium channel blockers</td>
                                <td>1218</td>
                                <td>279 (22.91)</td>
                                <td>100 (8.21)</td>
                            </tr>
                            <tr valign="top">
                                <td>Estrogens</td>
                                <td>368</td>
                                <td>80 (21.74)</td>
                                <td>80 (21.74)</td>
                            </tr>
                            <tr valign="top">
                                <td>NSAIDS</td>
                                <td>393</td>
                                <td>88 (22.39)</td>
                                <td>41 (10.43)</td>
                            </tr>
                            <tr valign="top">
                                <td>Opioids</td>
                                <td>1915</td>
                                <td>48 (2.51)</td>
                                <td>15 (0.78)</td>
                            </tr>
                            <tr valign="top">
                                <td>Oral hypoglycemics</td>
                                <td>503</td>
                                <td>139 (27.63)</td>
                                <td>136 (27.04)</td>
                            </tr>
                            <tr valign="top">
                                <td>Proton pump inhibitors</td>
                                <td>1333</td>
                                <td>238 (17.85)</td>
                                <td>51 (3.83)</td>
                            </tr>
                            <tr valign="top">
                                <td>Skeletal muscle relaxants</td>
                                <td>1643</td>
                                <td>34 (2.07)</td>
                                <td>9 (0.55)</td>
                            </tr>
                            <tr valign="top">
                                <td>Statins</td>
                                <td>3465</td>
                                <td>173 (4.99)</td>
                                <td>85 (2.45)</td>
                            </tr>
                            <tr valign="top">
                                <td>Triptans</td>
                                <td>671</td>
                                <td>218 (32.49)</td>
                                <td>24 (3.58)</td>
                            </tr>
                            <tr valign="top">
                                <td>Urinary incontinence</td>
                                <td>327</td>
                                <td>78 (23.85)</td>
                                <td>40 (12.23)</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
            </sec>
            <sec>
                <title>MEDLINE Elements</title>
                <p>MEDLINE elements are the fields in the MEDLINE format that document the major pieces of information of a publication (article) [<xref ref-type="bibr" rid="ref19">19</xref>]. The MEDLINE display format is used in PubMed MEDLINE records. As the most informative elements, title (TI), abstract (AB) and MeSH (MH) elements are widely used in related work to build feature spaces for machine learning algorithms. Publication type (PT) is also selected by some studies [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref21">21</xref>] as it could be a key factor for inclusion or exclusion decisions. In our preliminary work, we found that author information also has some predictive value in the article screening process. Therefore, in this study, in addition to TI, AB, MH, and PT, we also included the author (AU) element in our experiments.</p>
            </sec>
            <sec>
                <title>Similarity Score</title>
                <p>We calculate the similarity score using cosine similarity [<xref ref-type="bibr" rid="ref22">22</xref>]. Cosine similarity is widely applied to text mining and measures the cosine of the angle between a pair of vectors. It reflects the degree of similarity based on the presence and frequency of words or terms in each text. For every pair of AUs, PTs, and MHs, we simply compared them by exact string matching, because a minor difference may completely alter the outcome. For example, even if two author names are very similar, they may be two different people. However, TI and AB are free text. To calculate the similarity between two TIs and between two ABs, we preprocessed TIs and ABs by removing some common words from the PubMed stop word list [<xref ref-type="bibr" rid="ref23">23</xref>] (eg, the, is, are) that appear frequently in text, stemming each word by the classic Porter Stemmer algorithm [<xref ref-type="bibr" rid="ref24">24</xref>]. This approach, named alphabetic features, also has been verified to be an effective method to represent an article [<xref ref-type="bibr" rid="ref25">25</xref>]. The resulting similarity score ranges from 0 to 1 for each element, where 0 indicates independence and 1 means exactly the same. In summary, the similarity score is the sum of the MEDLINE element similarities.</p>
            </sec>
            <sec>
                <title>Simulated Interactive Recommendation Process</title>
                <sec>
                    <title>Overview</title>
                    <p>In this study, there is no human reviewer in this experimental process. The interactive recommendation process is simulated using the 15 completed DERP systematic reviews.</p>
                    <p>After identifying a list of articles to be screened for a systematic review, the recommendation process starts with calculating the similarity scores of any pairs of articles. This process constructs the relationship of the articles and builds a conceptualized article network. The first recommended article is selected based on key questions and search strategies of the systematic review. Once a recommended article is classified as included (IN) or excluded (EX), an IN list and an EX list are created (in this study, we used completed systematic reviews, which have predetermined decisions to simulate this step). We then iteratively recommend relevant articles based on the similarity to the IN. Assuming V is the set of all articles and U is the set of articles that have never been recommended, U is defined as U=V&#8722;IN&#8722;EX. Therefore, the sum of similarity scores represents the similarity between an article v with article(s) x in IN (see <xref ref-type="fig" rid="figure2">Figure 2</xref>).</p>
                    <fig id="figure2" position="anchor">
                        <label>Figure 2</label>
                        <caption>
                            <p>Calculation of the similarity between articles.</p>
                        </caption>
                        <graphic xlink:href="medinform_v3i3e28_fig2.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                    <p>In the formula, <italic>vx</italic> is a similarity vector representing the similarity of MEDLINE element(s) between x and v. The weight parameter <italic>w</italic> controls the contribution of each element similarity vector in the overall similarity score. We recommend articles with the highest overall similarity scores.</p>
                    <p>
                        <xref ref-type="fig" rid="figure3">Figure 3</xref> illustrates the simulated interactive recommendation process: (a) Process articles and extract data elements; (b) Calculate similarity scores (this will establish a conceptualized article network. Weight parameters are optional); (c) Recommend article(s) with the highest similarity to included articles list (in this simulation, one article is recommended per each round); (d) Human reviewers classify the recommended article as included or excluded (again, in this study, we used completed systematic review reports, which have predetermined decisions to simulate this step); (e) Create and update the included and excluded article list; Steps (c), (d), and (e) repeat until the article screening process is completed.</p>
                    <p>To evaluate our performance, we used two performance measures: work saved over sampling at 95% recall (WSS95) and F-measure. These measures are commonly used for evaluating similar work [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. We also used repeated analysis of variance (ANOVA) and post hoc analysis with Hommel multiple comparison adjustment to further explore statistical evidences. Hommel&#8217;s method&#160;demonstrated type I error protection with good power and is considered a better approach than Bonferroni or Homl [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>].</p>
                    <fig id="figure3" position="float">
                        <label>Figure 3</label>
                        <caption>
                            <p>Simulated interactive recommendation process.</p>
                        </caption>
                        <graphic xlink:href="medinform_v3i3e28_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                </sec>
                <sec>
                    <title>Work Saved Over Sampling at 95% Recall</title>
                    <p>WSS95 is a performance measure first proposed by Cohen [<xref ref-type="bibr" rid="ref7">7</xref>] to calculate the overall labor saving while maintaining the recall at 95%. This assumes that a recall higher than 0.95 is necessary for a document classification system. Precision should be as high as possible, as long as recall is at least 0.95. WSS95 is calculated with the equations in <xref ref-type="fig" rid="figure4">Figure 4</xref>.</p>
                    <p>TP is the number of true positive (relevant) articles, TN is the number of true negatives (irrelevant) articles, FN is the number of false negative (relevant) articles, and N is the total number of articles in each report.</p>
                    <fig id="figure4" position="anchor">
                        <label>Figure 4</label>
                        <caption>
                            <p>Formulas of precision, recall, and F<sub>1</sub>.</p>
                        </caption>
                        <graphic xlink:href="medinform_v3i3e28_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                </sec>
                <sec>
                    <title>F-Measure</title>
                    <p>F-measure is a measure of information retrieval accuracy. It considers both precision and recall and commonly combines them into a weighted harmonic mean. When they are weighted equally, the balanced F-measure is also called F<sub>1</sub>, where it reaches its best value at 1 and the worst value at 0. As a general measure of accuracy, F<sub>1</sub> has been widely used in previous works for the evaluation of classification performance, such as Cohen 2006 [<xref ref-type="bibr" rid="ref7">7</xref>], Bekhuis 2010 [<xref ref-type="bibr" rid="ref28">28</xref>], Kastrin 2010 [<xref ref-type="bibr" rid="ref29">29</xref>], and Frunza 2010 [<xref ref-type="bibr" rid="ref30">30</xref>]. For our performance evaluation purposes, when we recommend one article each time, the immediate recall, precision, and F<sub>1</sub> are dynamically changed each time (see <xref ref-type="fig" rid="figure5">Figure 5</xref>).</p>
                    <p>Since F<sub>1</sub> is dynamically changed over time, we can detect the highest F<sub>1</sub> from the steepness of the performance curve. That means if the higher F<sub>1</sub> scores occur during the early stage of the recommendation process (ie, before 50% of articles are screened), we are more likely to save more workload (high accuracy). We use F<sub>1</sub> to help us evaluate how accurate and how quickly we can make recommendations on the relevant articles.</p>
                    <fig id="figure5" position="anchor">
                        <label>Figure 5</label>
                        <caption>
                            <p>Formulas of WSS and WSS95.</p>
                        </caption>
                        <graphic xlink:href="medinform_v3i3e28_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                </sec>
            </sec>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <sec>
                <title>Single Element Performance</title>
                <p>The single MEDLINE element performance results are shown in <xref ref-type="table" rid="table2">Table 2</xref>. TI gets the best average WSS95 performance (34.01%), followed by PT (33.41%), and AB (33.30%). MH has a much lower WSS95 than other elements (25.31%). AU receives 0% workload saved due to the dispersion among articles&#8217; authorship. If there is no authorship similarity between articles, we are not able to recommend relevant articles based solely on AU element. Using PT also brings good performance; we speculate it is a key consideration when conducting system reviews. However, repeated ANOVA shows that the WSS95 performances across TI, AB, PT, and MH are not statistically different (<italic>P</italic>=.079).</p>
                <table-wrap position="float" id="table2">
                    <label>Table 2</label>
                    <caption>
                        <p>Single element WSS95 performance.</p>
                    </caption>
                    <table width="499" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="173" />
                        <col width="46" />
                        <col width="58" />
                        <col width="46" />
                        <col width="34" />
                        <col width="58" />
                        <thead>
                            <tr valign="top">
                                <td>SR report topic</td>
                                <td>TI</td>
                                <td>AB</td>
                                <td>PT</td>
                                <td>AU</td>
                                <td>MH</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>ACE inhibitors</td>
                                <td>76.49</td>
                                <td>71.07</td>
                                <td>33.22</td>
                                <td>0</td>
                                <td>47.37</td>
                            </tr>
                            <tr valign="top">
                                <td>ADHD</td>
                                <td>80.26</td>
                                <td>65.10</td>
                                <td>22.56</td>
                                <td>0</td>
                                <td>47.00</td>
                            </tr>
                            <tr valign="top">
                                <td>Antihistamines</td>
                                <td>13.55</td>
                                <td>15.81</td>
                                <td>32.58</td>
                                <td>0</td>
                                <td>2.58</td>
                            </tr>
                            <tr valign="top">
                                <td>Atypical antipsychotics</td>
                                <td>17.23</td>
                                <td>20.54</td>
                                <td>19.64</td>
                                <td>0</td>
                                <td>9.46</td>
                            </tr>
                            <tr valign="top">
                                <td>Beta blockers</td>
                                <td>44.74</td>
                                <td>49.95</td>
                                <td>43.77</td>
                                <td>0</td>
                                <td>28.67</td>
                            </tr>
                            <tr valign="top">
                                <td>Calcium channel blockers</td>
                                <td>19.38</td>
                                <td>16.34</td>
                                <td>18.64</td>
                                <td>0</td>
                                <td>20.94</td>
                            </tr>
                            <tr valign="top">
                                <td>Estrogens</td>
                                <td>29.35</td>
                                <td>29.08</td>
                                <td>17.93</td>
                                <td>0</td>
                                <td>38.59</td>
                            </tr>
                            <tr valign="top">
                                <td>NSAIDS</td>
                                <td>63.36</td>
                                <td>66.67</td>
                                <td>58.27</td>
                                <td>0</td>
                                <td>33.84</td>
                            </tr>
                            <tr valign="top">
                                <td>Opioids</td>
                                <td>8.30</td>
                                <td>9.82</td>
                                <td>37.23</td>
                                <td>0</td>
                                <td>6.48</td>
                            </tr>
                            <tr valign="top">
                                <td>Oral hypoglycemics</td>
                                <td>11.73</td>
                                <td>12.13</td>
                                <td>22.27</td>
                                <td>0</td>
                                <td>7.55</td>
                            </tr>
                            <tr valign="top">
                                <td>Proton pump inhibitors</td>
                                <td>43.74</td>
                                <td>15.60</td>
                                <td>35.48</td>
                                <td>0</td>
                                <td>20.56</td>
                            </tr>
                            <tr valign="top">
                                <td>Skeletal muscle relaxants</td>
                                <td>0</td>
                                <td>36.03</td>
                                <td>74.68</td>
                                <td>0</td>
                                <td>42.85</td>
                            </tr>
                            <tr valign="top">
                                <td>Statins</td>
                                <td>25.52</td>
                                <td>30.17</td>
                                <td>13.31</td>
                                <td>0</td>
                                <td>13.68</td>
                            </tr>
                            <tr valign="top">
                                <td>Triptans</td>
                                <td>45.60</td>
                                <td>42.47</td>
                                <td>28.17</td>
                                <td>0</td>
                                <td>33.23</td>
                            </tr>
                            <tr valign="top">
                                <td>Urinary incontinence</td>
                                <td>30.89</td>
                                <td>18.65</td>
                                <td>43.43</td>
                                <td>0</td>
                                <td>26.91</td>
                            </tr>
                            <tr valign="top">
                                <td>Average WSS95</td>
                                <td>34.01</td>
                                <td>33.30</td>
                                <td>33.41</td>
                                <td>0</td>
                                <td>25.31</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <p>
                    <xref ref-type="table" rid="table3">Table 3</xref> shows the highest F<sub>1</sub> performance and corresponding timing during the recommendation process. When performance is good, the highest F<sub>1</sub> usually occurs during the early stage (discussed in the Methods section). We found that AB and PT gain the best F<sub>1</sub> (0.3683 and 0.3437, respectively); MH and TI have lower F<sub>1</sub> scores (0.3116 and 0.3039, respectively). Again, AU gets the worst F<sub>1</sub>, only 0.1365. We also examined the corresponding timing of the highest F<sub>1</sub>. We observed that the best F<sub>1</sub> value appears when 5% to 20% of articles are screened, which is at the early stage of recommendation. MEDLINE elements with higher F<sub>1</sub> scores and lower percentages of articles screened indicate high accuracy performance during the early stage of recommendation (eg, AB). We concluded that AB and PT bring the best early stage performance; in other words, the recommendation accuracy of AB and PT in the beginning is better than that of the other elements. However, repeated ANOVA shows that the F<sub>1</sub> performances across TI, AB, PT, and MH are not statistically different (<italic>P</italic>=.073). Pairwise comparison only finds significant difference between TI and AB (AU is not considered due to its inferior performance).</p>
                <table-wrap position="float" id="table3">
                    <label>Table 3</label>
                    <caption>
                        <p>Single element F<sub>1</sub> performance; percentage of articles screened at F<sub>1</sub>.</p>
                    </caption>
                    <table width="582" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="112" />
                        <col width="70" />
                        <col width="64" />
                        <col width="94" />
                        <col width="83" />
                        <col width="75" />
                        <thead>
                            <tr valign="top">
                                <td>SR report topic</td>
                                <td>TI<break />F<sub>1</sub> (%)</td>
                                <td>AB<break />F<sub>1</sub> (%)</td>
                                <td>PT<break />F<sub>1</sub> (%)</td>
                                <td>AU<break />F<sub>1</sub> (%)</td>
                                <td>MH<break />F<sub>1</sub> (%)</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>ACE inhibitors</td>
                                <td>0.3444 (4)</td>
                                <td>0.3121 (4)</td>
                                <td>0.2182 (&#60;1)</td>
                                <td>0.1872 (6)</td>
                                <td>0.2368 (1)</td>
                            </tr>
                            <tr valign="top">
                                <td>ADHD</td>
                                <td>0.2885 (10)</td>
                                <td>0.3824 (6)</td>
                                <td>0.2963 (&#60;1)</td>
                                <td>0.0909 (&#60;1)</td>
                                <td>0.5556 (4)</td>
                            </tr>
                            <tr valign="top">
                                <td>Antihistamines</td>
                                <td>0.2593 (12)</td>
                                <td>0.4000 (3)</td>
                                <td>0.2759 (&#60;1)</td>
                                <td>0.1111 (&#60;1)</td>
                                <td>0.3333 (3)</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Atypical antipsychotics</td>
                                <td>0.3447 (26)</td>
                                <td>0.4248 (14)</td>
                                <td>0.4363 (5, 12<sup>a</sup>)</td>
                                <td>0.0135 (&#60;1)</td>
                                <td>0.3113 (40)</td>
                            </tr>
                            <tr valign="top">
                                <td>Beta blockers</td>
                                <td>0.1972 (1)</td>
                                <td>0.2710 (5)</td>
                                <td>0.2105 (&#60;1)</td>
                                <td>0.0417 (&#60;1)</td>
                                <td>0.0957 (19)</td>
                            </tr>
                            <tr valign="top">
                                <td>Calcium channel<break />blockers</td>
                                <td>0.2026 (10)</td>
                                <td>0.2672 (11)</td>
                                <td>0.2662 (15)</td>
                                <td>0.1261 (9)</td>
                                <td>0.2579 (2)</td>
                            </tr>
                            <tr valign="top">
                                <td>Estrogens</td>
                                <td>0.5140 (36)</td>
                                <td>0.5612 (29)</td>
                                <td>0.4937 (18)</td>
                                <td>0.0244 (&#60;1)</td>
                                <td>0.5536 (39)</td>
                            </tr>
                            <tr valign="top">
                                <td>NSAIDS</td>
                                <td>0.4368 (34)</td>
                                <td>0.5870 (13)</td>
                                <td>0.6761 (8)</td>
                                <td>0.4853 (24)</td>
                                <td>0.3650 (24)</td>
                            </tr>
                            <tr valign="top">
                                <td>Opioids</td>
                                <td>0.2727 (&#60;1)</td>
                                <td>0.1429 (&#60;1)</td>
                                <td>0.2222 (&#60;1)</td>
                                <td>0.1111 (&#60;1)</td>
                                <td>0.2500 (&#60;1)</td>
                            </tr>
                            <tr valign="top">
                                <td>Oral hypoglycemics</td>
                                <td>0.4509 (88)</td>
                                <td>0.4603 (76)</td>
                                <td>0.5019 (78)</td>
                                <td>0.0145 (&#60;1)</td>
                                <td>0.4527 (53)</td>
                            </tr>
                            <tr valign="top">
                                <td>Proton pump<break />inhibitors</td>
                                <td>0.3333 (1)</td>
                                <td>0.3860 (5)</td>
                                <td>0.1299 (42)</td>
                                <td>0.0377 (&#60;1)</td>
                                <td>0.1775 (25)</td>
                            </tr>
                            <tr valign="top">
                                <td>Skeletal muscle<break />relaxants</td>
                                <td>0.1429 (&#60;1)</td>
                                <td>0.1981 (&#60;1)</td>
                                <td>0.2286 (2)</td>
                                <td>0.1429 (&#60;1)</td>
                                <td>0.2222 (&#60;1)</td>
                            </tr>
                            <tr valign="top">
                                <td>Statins</td>
                                <td>0.2278 (6)</td>
                                <td>0.2479 (1)</td>
                                <td>0.4019 (4)</td>
                                <td>0.1484 (12)</td>
                                <td>0.1563 (1)</td>
                            </tr>
                            <tr valign="top">
                                <td>Triptans</td>
                                <td>0.1739 (10)</td>
                                <td>0.360 (4)</td>
                                <td>0.2569 (13)</td>
                                <td>0.0690 (&#60;1)</td>
                                <td>0.2750 (8)</td>
                            </tr>
                            <tr valign="top">
                                <td>Urinary<break />incontinence</td>
                                <td>0.3697 (24)</td>
                                <td>0.5243 (19)</td>
                                <td>0.5405 (10)</td>
                                <td>0.4444 (13)</td>
                                <td>0.4317 (30)</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Average<sup>b</sup>
                                </td>
                                <td>0.3039 (18)</td>
                                <td>0.3683 (13)</td>
                                <td>0.3437 (14)</td>
                                <td>0.1365 (5)</td>
                                <td>0.3116 (17)</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table3fn1">
                            <p>
                                <sup>a</sup>Both 5% and 12% have F<sub>1</sub> = 0.4363. The average of 5% and 12% (8.5%) is taken to calculate the average value on the last row of the table.</p>
                        </fn>
                        <fn id="table3fn2">
                            <p>
                                <sup>b</sup>&#60;1% is considered as 1% for calculating the average percentage.</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
            </sec>
            <sec>
                <title>Composited Elements Performance</title>
                <p>Different MEDLINE elements play different roles in the systematic review process, and their corresponding performance varied greatly as described above. To further explore their predictive abilities, we examined their collaborative performances. In total we examined 22 combinations and chose the top WSS95 performance of 6 combinations (see <xref ref-type="table" rid="table4">Table 4</xref>). Each of the 6 combination performances has an average of more than 36% WSS95. <xref ref-type="table" rid="table5">Table 5</xref> shows the F<sub>1</sub> performance of the 6 combinations.</p>
                <p>We also conducted statistical analysis with repeated ANOVA for the composited elements performance. For WSS95, the results show that there is no statistical difference in WSS95 performance across the 6 combinations (<italic>P</italic>=.332). For F<sub>1</sub> performance, there is also no statistical significant difference across the 6 combinations (<italic>P</italic>=.069).</p>
                <p>In summary, we found that the predictive ability of MEDLINE elements varies according to systematic review topics. Overall, TI and PT have better WSS95 performance on average but are not statistically different. AB has the best average F<sub>1</sub> scores and is statistically better than TI.</p>
                <table-wrap position="float" id="table4">
                    <label>Table 4</label>
                    <caption>
                        <p>WSS95 of the top 6 combinations.</p>
                    </caption>
                    <table width="578" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="147" />
                        <col width="52" />
                        <col width="52" />
                        <col width="52" />
                        <col width="52" />
                        <col width="52" />
                        <col width="72" />
                        <thead>
                            <tr valign="top">
                                <td>SR report topic</td>
                                <td>TI+AB</td>
                                <td>TI+AB<break />+MH</td>
                                <td>TI+AB<break />+PT</td>
                                <td>TI+AB<break />+AU</td>
                                <td>TI+AB<break />+PT+AU</td>
                                <td>TI+AB+MH<break />+PT+AU</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>ACE inhibitors</td>
                                <td>76.38</td>
                                <td>76.85</td>
                                <td>74.29</td>
                                <td>75.79</td>
                                <td>73.70</td>
                                <td>75.08</td>
                            </tr>
                            <tr valign="top">
                                <td>ADHD</td>
                                <td>80.38</td>
                                <td>79.79</td>
                                <td>67.92</td>
                                <td>80.14</td>
                                <td>67.92</td>
                                <td>56.17</td>
                            </tr>
                            <tr valign="top">
                                <td>Antihistamines</td>
                                <td>16.13</td>
                                <td>10.65</td>
                                <td>24.52</td>
                                <td>16.13</td>
                                <td>24.52</td>
                                <td>18.39</td>
                            </tr>
                            <tr valign="top">
                                <td>Atypical antipsychotics</td>
                                <td>20.89</td>
                                <td>14.20</td>
                                <td>17.95</td>
                                <td>20.63</td>
                                <td>17.77</td>
                                <td>14.38</td>
                            </tr>
                            <tr valign="top">
                                <td>Beta blockers</td>
                                <td>60.14</td>
                                <td>60.09</td>
                                <td>65.01</td>
                                <td>60.96</td>
                                <td>64.72</td>
                                <td>65.21</td>
                            </tr>
                            <tr valign="top">
                                <td>Calcium channel blockers</td>
                                <td>18.23</td>
                                <td>18.64</td>
                                <td>17.32</td>
                                <td>18.39</td>
                                <td>17.49</td>
                                <td>22.82</td>
                            </tr>
                            <tr valign="top">
                                <td>Estrogens</td>
                                <td>33.42</td>
                                <td>36.14</td>
                                <td>22.55</td>
                                <td>33.97</td>
                                <td>22.55</td>
                                <td>29.08</td>
                            </tr>
                            <tr valign="top">
                                <td>NSAIDS</td>
                                <td>72.26</td>
                                <td>75.57</td>
                                <td>77.35</td>
                                <td>70.48</td>
                                <td>76.34</td>
                                <td>77.86</td>
                            </tr>
                            <tr valign="top">
                                <td>Opioids</td>
                                <td>6.01</td>
                                <td>11.75</td>
                                <td>8.98</td>
                                <td>5.95</td>
                                <td>8.98</td>
                                <td>12.17</td>
                            </tr>
                            <tr valign="top">
                                <td>Oral hypoglycemics</td>
                                <td>11.33</td>
                                <td>13.12</td>
                                <td>13.52</td>
                                <td>11.13</td>
                                <td>13.52</td>
                                <td>12.72</td>
                            </tr>
                            <tr valign="top">
                                <td>Proton pump inhibitors</td>
                                <td>19.20</td>
                                <td>21.31</td>
                                <td>19.65</td>
                                <td>19.05</td>
                                <td>19.65</td>
                                <td>20.11</td>
                            </tr>
                            <tr valign="top">
                                <td>Skeletal muscle relaxants</td>
                                <td>41.94</td>
                                <td>46.44</td>
                                <td>58.55</td>
                                <td>41.87</td>
                                <td>58.49</td>
                                <td>60.01</td>
                            </tr>
                            <tr valign="top">
                                <td>Statins</td>
                                <td>29.10</td>
                                <td>27.11</td>
                                <td>27.80</td>
                                <td>30.96</td>
                                <td>27.71</td>
                                <td>26.07</td>
                            </tr>
                            <tr valign="top">
                                <td>Triptans</td>
                                <td>48.29</td>
                                <td>51.71</td>
                                <td>39.64</td>
                                <td>50.52</td>
                                <td>39.79</td>
                                <td>40.98</td>
                            </tr>
                            <tr valign="top">
                                <td>Urinary incontinence</td>
                                <td>12.84</td>
                                <td>11.01</td>
                                <td>20.80</td>
                                <td>12.84</td>
                                <td>20.80</td>
                                <td>14.37</td>
                            </tr>
                            <tr valign="top">
                                <td>Average</td>
                                <td>36.44</td>
                                <td>36.96</td>
                                <td>37.06</td>
                                <td>36.59</td>
                                <td>36.93</td>
                                <td>36.35</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <table-wrap position="float" id="table5">
                    <label>Table 5</label>
                    <caption>
                        <p>F<sub>1</sub> of the top 6 combinations.</p>
                    </caption>
                    <table width="528" border="0" cellpadding="8" cellspacing="0" rules="groups" frame="hsides">
                        <col width="59" />
                        <col width="15" />
                        <col width="28" />
                        <col width="8" />
                        <col width="36" />
                        <col width="5" />
                        <col width="39" />
                        <col width="0" />
                        <col width="52" />
                        <col width="57" />
                        <col width="57" />
                        <thead>
                            <tr valign="top">
                                <td colspan="2">SR report topic</td>
                                <td colspan="2">TI+AB<break />F<sub>1</sub> (%)</td>
                                <td colspan="2">TI+AB+MH<break />F<sub>1</sub> (%)</td>
                                <td colspan="2">TI+AB+PT<break />F<sub>1</sub> (%)</td>
                                <td>TI+AB+AU<break />F<sub>1</sub> (%)</td>
                                <td>TI+AB+PT+AU<break />F<sub>1</sub> (%)</td>
                                <td>TI+AB+MH+PT+AU<break />F<sub>1</sub> (%)</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td colspan="2">ACE inhibitors</td>
                                <td colspan="2">0.4156 (1)</td>
                                <td colspan="2">0.4000 (2)</td>
                                <td colspan="2">0.4051 (1)</td>
                                <td>0.3902 (2)</td>
                                <td>0.3971 (4)</td>
                                <td>0.3774 (3)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">ADHD</td>
                                <td colspan="2">0.4000 (3)</td>
                                <td colspan="2">0.4688 (5)</td>
                                <td colspan="2">0.5455 (4)</td>
                                <td>0.4286 (6)</td>
                                <td>0.5306 (3)</td>
                                <td>0.5818 (4)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">Antihistamines</td>
                                <td colspan="2">0.3226 (5)</td>
                                <td colspan="2">0.3333 (10)</td>
                                <td colspan="2">0.2903 (15)</td>
                                <td>0.3226 (5)</td>
                                <td>0.2903 (15)</td>
                                <td>0.2813 (15)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">Atypical<break />antipsychotics</td>
                                <td colspan="2">0.4364 (16)</td>
                                <td colspan="2">0.4241 (15)</td>
                                <td colspan="2">0.4887 (15)</td>
                                <td>0.4411 (17)</td>
                                <td>0.4856 (15)</td>
                                <td>0.4606 (15)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">Beta blockers</td>
                                <td colspan="2">0.2800 (3)</td>
                                <td colspan="2">0.3043 (2)</td>
                                <td colspan="2">0.3590 (2)</td>
                                <td>0.2667 (3)</td>
                                <td>0.3596 (2)</td>
                                <td>0.3333 (3)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">Calcium channel<break />blockers</td>
                                <td colspan="2">0.2335 (8)</td>
                                <td colspan="2">0.2620 (11)</td>
                                <td colspan="2">0.2804 (9)</td>
                                <td>0.2323 (8)</td>
                                <td>0.2816 (9)</td>
                                <td>0.2995 (9)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">Estrogens</td>
                                <td colspan="2">0.6000 (30)</td>
                                <td colspan="2">0.6237 (29)</td>
                                <td colspan="2">0.6047 (25)</td>
                                <td>0.5979 (31)</td>
                                <td>0.6118 (24)</td>
                                <td>0.6171 (26)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">NSAIDS</td>
                                <td colspan="2">0.6667 (16)</td>
                                <td colspan="2">0.6154 (16)</td>
                                <td colspan="2">0.6966 (12)</td>
                                <td>0.6471 (16)</td>
                                <td>0.6809 (13)</td>
                                <td>0.6667 (15)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">Opioids</td>
                                <td colspan="2">0.3000 (0)</td>
                                <td colspan="2">0.3158 (&#60;1)</td>
                                <td colspan="2">0.3000 (&#60;1)</td>
                                <td>0.3000 (&#60;1)</td>
                                <td>0.3000 (&#60;1)</td>
                                <td>0.3158 (&#60;1)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">Oral hypoglycemics</td>
                                <td colspan="2">0.4497 (90)</td>
                                <td colspan="2">0.4541 (88)</td>
                                <td colspan="2">0.4553 (86)</td>
                                <td>0.4489 (92)</td>
                                <td>0.4561 (75)</td>
                                <td>0.4635 (82)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">Proton pump<break />inhibitors</td>
                                <td colspan="2">0.4384 (7)</td>
                                <td colspan="2">0.4737 (5)</td>
                                <td colspan="2">0.5172 (5)</td>
                                <td>0.4552 (7)</td>
                                <td>0.5455 (5)</td>
                                <td>0.5079 (6)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">Skeletal muscle<break />relaxants</td>
                                <td colspan="2">0.2222 (1)</td>
                                <td colspan="2">0.2353 (&#60;1)</td>
                                <td colspan="2">0.2500 (&#60;1)</td>
                                <td>0.2222 (1)</td>
                                <td>0.2500 (&#60;1)</td>
                                <td>0.2667 (&#60;1)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">Statins</td>
                                <td colspan="2">0.2994 (2)</td>
                                <td colspan="2">0.3281 (1)</td>
                                <td colspan="2">0.3382 (1)</td>
                                <td>0.2959 (2)</td>
                                <td>0.3358 (2)</td>
                                <td>0.3465 (1)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">Triptans</td>
                                <td colspan="2">0.3636 (3)</td>
                                <td colspan="2">0.3913 (3)</td>
                                <td colspan="2">0.3556 (3)</td>
                                <td>0.3556 (3)</td>
                                <td>0.3529 (4)</td>
                                <td>0.3913 (3)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">Urinary incontinence</td>
                                <td colspan="2">0.5063 (12)</td>
                                <td colspan="2">0.5347 (19)</td>
                                <td colspan="2">0.5505 (21)</td>
                                <td>0.5263 (11)</td>
                                <td>0.5507 (9)</td>
                                <td>0.5843 (15)</td>
                            </tr>
                            <tr valign="bottom">
                                <td colspan="2">Average<sup>a</sup>
                                </td>
                                <td colspan="2">0.3956 (13)</td>
                                <td colspan="2">0.4110 (14)</td>
                                <td colspan="2">0.4291 (14)</td>
                                <td>0.3954 (14)</td>
                                <td>0.4286 (12)</td>
                                <td>0.4329 (13)</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table5fn1">
                            <p>
                                <sup>a</sup>&#60;1% is considered as 1% for calculating the average percentage.</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
            </sec>
            <sec>
                <title>Performance Comparison With Existing Literature</title>
                <p>Here we also compared our WSS95 performance with existing machine learning model training approaches (we were not able to compare the F<sub>1</sub> performances as they were not provided). Since TI+AB+PT has the simplest combination and its performance is equivalent or better than others, we chose TI+AB+PT (weight setting = 1:1:1) to compare against existing machine learning model training approaches, including voting perceptron-based automated citation classification system (VP), factorized complement na&#239;ve Bayes with weight engineering (FCNB/WE) and support vector machine (SVM) (<xref ref-type="table" rid="table6">Table 6</xref>).</p>
                <table-wrap position="float" id="table6">
                    <label>Table 6</label>
                    <caption>
                        <p>WSS95 comparison with the Cohen and Matwin systems across 15 SR topics.</p>
                    </caption>
                    <table width="528" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="147" />
                        <col width="71" />
                        <col width="80" />
                        <col width="85" />
                        <col width="75" />
                        <thead>
                            <tr valign="bottom">
                                <td>SR report topic</td>
                                <td>Cohen 2006 [<xref ref-type="bibr" rid="ref7">7</xref>]<break />(VP<sup>a</sup>)</td>
                                <td>Cohen 2008 [<xref ref-type="bibr" rid="ref12">12</xref>]<break />(SVM<sup>b</sup>)</td>
                                <td>Matwin 2010 [<xref ref-type="bibr" rid="ref15">15</xref>]<break />(FCNB/WE<sup>c</sup>)</td>
                                <td>Our study <break />(TI+AB+PT)</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>ACE inhibitors</td>
                                <td>56.61</td>
                                <td>73.30</td>
                                <td>52.30</td>
                                <td>74.29</td>
                            </tr>
                            <tr valign="top">
                                <td>ADHD</td>
                                <td>67.95</td>
                                <td>52.60</td>
                                <td>62.20</td>
                                <td>67.92</td>
                            </tr>
                            <tr valign="top">
                                <td>Antihistamines</td>
                                <td>0</td>
                                <td>23.60</td>
                                <td>14.90</td>
                                <td>24.52</td>
                            </tr>
                            <tr valign="top">
                                <td>Atypical antipsychotics</td>
                                <td>14.11</td>
                                <td>17.00</td>
                                <td>20.60</td>
                                <td>17.95</td>
                            </tr>
                            <tr valign="top">
                                <td>Beta blockers</td>
                                <td>28.44</td>
                                <td>46.50</td>
                                <td>36.70</td>
                                <td>65.01</td>
                            </tr>
                            <tr valign="top">
                                <td>Calcium channel blockers</td>
                                <td>12.21</td>
                                <td>43.00</td>
                                <td>23.40</td>
                                <td>17.32</td>
                            </tr>
                            <tr valign="top">
                                <td>Estrogens</td>
                                <td>18.34</td>
                                <td>41.40</td>
                                <td>37.50</td>
                                <td>22.55</td>
                            </tr>
                            <tr valign="top">
                                <td>NSAIDS</td>
                                <td>49.67</td>
                                <td>67.20</td>
                                <td>52.80</td>
                                <td>77.35</td>
                            </tr>
                            <tr valign="top">
                                <td>Opioids</td>
                                <td>13.32</td>
                                <td>36.40</td>
                                <td>55.40</td>
                                <td>8.98</td>
                            </tr>
                            <tr valign="top">
                                <td>Oral hypoglycemics</td>
                                <td>8.96</td>
                                <td>13.60</td>
                                <td>8.50</td>
                                <td>13.52</td>
                            </tr>
                            <tr valign="top">
                                <td>Proton pump inhibitors</td>
                                <td>27.68</td>
                                <td>32.80</td>
                                <td>22.90</td>
                                <td>19.65</td>
                            </tr>
                            <tr valign="top">
                                <td>Skeletal muscle relaxants</td>
                                <td>0</td>
                                <td>37.40</td>
                                <td>26.50</td>
                                <td>58.55</td>
                            </tr>
                            <tr valign="top">
                                <td>Statins</td>
                                <td>24.71</td>
                                <td>49.10</td>
                                <td>31.50</td>
                                <td>27.80</td>
                            </tr>
                            <tr valign="top">
                                <td>Triptans</td>
                                <td>3.37</td>
                                <td>34.60</td>
                                <td>27.40</td>
                                <td>39.64</td>
                            </tr>
                            <tr valign="top">
                                <td>Urinary incontinence</td>
                                <td>26.14</td>
                                <td>43.20</td>
                                <td>29.60</td>
                                <td>20.80</td>
                            </tr>
                            <tr valign="top">
                                <td>Average</td>
                                <td>23.43</td>
                                <td>40.80</td>
                                <td>33.50</td>
                                <td>37.06</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table6fn1">
                            <p>
                                <sup>a</sup>VP: voting Perceptron-based automated citation classification system</p>
                        </fn>
                        <fn id="table6fn2">
                            <p>
                                <sup>b</sup>FCNB/WE: factorized complement na&#239;ve Bayes with weight engineering</p>
                        </fn>
                        <fn id="table6fn3">
                            <p>
                                <sup>c</sup>SVM: support vector machine</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
                <p>The repeated ANOVA test shows significant different across four studies (<italic>P</italic>=.005). The pairwise comparison with Hommel adjustment (<xref ref-type="table" rid="table7">Table 7</xref>) shows that there is no significant difference between our study and either Cohen 2008 [<xref ref-type="bibr" rid="ref12">12</xref>] or Matwin 2010 [<xref ref-type="bibr" rid="ref15">15</xref>] <italic>(P</italic>=.4979, .4979) but is significantly better than Cohen 2006 [<xref ref-type="bibr" rid="ref7">7</xref>] (<italic>P</italic>=.0475). In summary, our methods provide competitive results to traditional machine learning model training approaches.</p>
                <p>We were not able to compare side by side with the Wallace group [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>] because they used different systematic reviews. Their performance is by far the best among machine learning model training approaches (nearly 50% work reduction without missing any relevant articles) as they incorporate active learning with user interaction, which accepts feedback from users (similar to our Step D in <xref ref-type="fig" rid="figure3">Figure 3</xref>) [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. This outcome is predictable as machine learning uses training data to model the classifier. With a large amount of training data, the classifier can perform almost perfectly. However, it is encouraging to us that without using algorithms to formulate a classification model, we are currently able to perform similarly to the model training approaches.</p>
                <table-wrap position="float" id="table7">
                    <label>Table 7</label>
                    <caption>
                        <p>The P values of pairwise comparison of four studies.</p>
                    </caption>
                    <table width="504" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="82" />
                        <col width="82" />
                        <col width="76" />
                        <col width="95" />
                        <col width="100" />
                        <thead>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Cohen 2006</td>
                                <td>Cohen 2008</td>
                                <td>Matwin 2010</td>
                                <td>Our study (TI+AB+PT)</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Cohen 2006</td>
                                <td>&#8212;</td>
                                <td>0.0012</td>
                                <td>0.0433</td>
                                <td>0.0475</td>
                            </tr>
                            <tr valign="top">
                                <td>Cohen 2008</td>
                                <td>0.0012</td>
                                <td>&#8212;</td>
                                <td>0.0649</td>
                                <td>0.4979</td>
                            </tr>
                            <tr valign="top">
                                <td>Matwin 2010</td>
                                <td>0.0433</td>
                                <td>0.0649</td>
                                <td>&#8212;</td>
                                <td>0.4979</td>
                            </tr>
                            <tr valign="top">
                                <td>Our study</td>
                                <td>0.0475</td>
                                <td>0.4979</td>
                                <td>0.4979</td>
                                <td>&#8212;</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
            </sec>
            <sec>
                <title>Performance With Weight Parameters</title>
                <p>Since different systematic reviews have diverse scopes (for example, one may require sufficient study information from an AB while another may have strict criteria on PT), we were interested in whether different weight parameters would alter the performance. We conducted experiments on different weight settings (eg, TI:PT:AU=3:1:2, TI:PT:AU=2:2:1, TI:PT:AU=3:2:1). The results revealed that when one element&#8217;s weight was increased to achieve a higher performance for some reports, some other reports would have performance degradation. Overall, we could not find a universal weight setting that benefited all reports. This may be explained in part by the diverse scopes captured in different systematic reviews. In addition, although some weighted combinations bring better global performance (ie, average WSS95 among 15 reports), the enhancement from the baseline (elements in the combination are equally weighted) is limited. For example, consider the combination of TI+PT+AU, the baseline performance (TI:PT:AU=1:1:1) evaluated by average WSS95 is 35.45%, while the performance of its weighted one (TI:PT:AU=3:1:2) (37.30%) gains less than 2%. There is not much improvement with weighted parameters.</p>
            </sec>
            <sec>
                <title>Interpreting the Inconsistency of WSS95 and F<sub>1</sub>
                </title>
                <p>During our experiments, we also discovered inconsistencies in performance with respect to WSS95 and F<sub>1</sub>. For example, some combinations had high F<sub>1</sub> performance with low WSS95 and vice versa. We examined the recall performance during the entire recommendation process. <xref ref-type="fig" rid="figure6">Figure 6</xref> presents the performance curves of the Proton Pump Inhibitors systematic review with two different element combinations, TI+AU (<xref ref-type="fig" rid="figure6">Figure 6</xref>A) and TI+AB+PT+AU (<xref ref-type="fig" rid="figure6">Figure 6</xref>B) (all equally weighted). The x-axis represents the percentage of articles screened (or recommended); the y-axis represents the recall rate. From the <xref ref-type="fig" rid="figure6">Figure 6</xref>, we see that in the early screening stage (5% of articles screened), curve B (recall of 70%) is steeper than curve A (recall of 40%). This also shows in their F<sub>1</sub> scores: the highest F<sub>1</sub> scores of curve A and B are 0.3778 and 0.5455, respectively, during the early screening stage. However, at the later stage, curve A reaches the recall of 100% faster than curve B after screening 60% of articles (WSS95 scores of curve A and B are 46.51% and 19.65%, respectively). In summary, current performance measures using WSS95, area under the curve, precision, and recall could not reflect the performance over time. Some elements may accelerate the performance in the beginning of the recommendation (screening) process. Using multiple performance measures and especially including the highest F<sub>1</sub> at a certain time point can better help us recognize the strength and weakness of different elements during the entire screening process</p>
                <fig id="figure6" position="float">
                    <label>Figure 6</label>
                    <caption>
                        <p>Proton Pump Inhibitors recall performance during the recommendation process using two different element combinations.</p>
                    </caption>
                    <graphic xlink:href="medinform_v3i3e28_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <sec>
                <title>Customizable Weight Parameters May Enhance Performance More Efficiently</title>
                <p>Due to the fact that different systematic reviews have different review scopes, we could not identify one universal weight setting which could be successfully applied to every systematic review. A similar idea was mentioned in Matwin&#8217;s work [<xref ref-type="bibr" rid="ref15">15</xref>], where weight parameters (or weight multipliers) were tunable and being modified with regards to different systematic reviews. While different systematic reviews should have different weight multiplier values, we also agree that the process of computing such a value for every systematic review would be very time consuming [<xref ref-type="bibr" rid="ref15">15</xref>]. Therefore, instead of finding the best weight parameters for each systematic review, flexible, customizable weight parameters for human reviewers based on their systematic review scopes and screening priority would be more useful and practical. Without adjusting weight parameters, our average performance is higher than the FCNB/WE approach [<xref ref-type="bibr" rid="ref15">15</xref>] (<xref ref-type="table" rid="table6">Table 6</xref>). It is likely that we could improve even further when adjustable weight parameters are provided to human reviewers.</p>
            </sec>
            <sec>
                <title>Moving Toward an Efficient and Generalizable Approach</title>
                <p>Currently the work of biomedical text classification for the purpose of reducing systematic review workload has mainly used machine learning model training approaches. Na&#239;ve Bayes and SVM are two widely applied machine learning algorithms. Although these machine learning approaches provide excellent performance in text classification on specific systematic review topics, it is a challenge to apply the existing machine learning algorithms to other new systematic review topics. It could be time consuming to construct training models as well [<xref ref-type="bibr" rid="ref15">15</xref>]. In addition, the implementation of machine learning approaches usually requires an understanding of the algorithm. For example, operators need to choose a kernel or tune the setting of parameters for the SVM algorithm. Thus, it is difficult to apply the approach to a new systematic review topic without a well-trained classification model or without significant machine learning knowledge. Other approaches, such as text mining or statistical approaches, were also studied to facilitate the systematic review process [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>], but they also rely heavily on prior decisions to find key terms to differentiate between the relevant and irrelevant classes, which is very similar to supervised machine learning.</p>
                <p>Overcoming the limitations mentioned above, we provided a generalizable approach which can be easily deployed to facilitate any systematic review. Also, because we established an article network providing similarity relationship between articles, the iterative interactive recommendation process takes almost no time. Currently, our processing time to construct an article network takes from several seconds to several minutes for 300 to 3500 articles, but the recommendation step is real-time. This processing time is reasonable considering the non-trivial steps of building article networks. To be specific, this is polynomial time processing, not linear time processing. In our study, the backend programs for the computation of similarity matrixes are written in C/C++, which is the most efficient approach from the perspective of computer architecture and compiler. We also plan to improve the time responses for larger systematic reviews that may contain ten thousand articles or more. Most importantly, our approach can be applied to any systematic review topic and nontechnical human reviewers can use it with ease.</p>
            </sec>
            <sec>
                <title>Study Limitation</title>
                <p>This study only uses 15 DERP reports for evaluation. Although it is our assumption that our approach will be applicable globally, datasets from other systematic review teams are needed to further demonstrate our hypothesis. Our future plans include collaborating with other systematic review teams.</p>
            </sec>
            <sec>
                <title>Future Direction</title>
                <p>As we have discussed in the Methods section, different article elements have different predictive abilities regarding the evaluation scheme of WSS95 or F<sub>1</sub> score. With a better F<sub>1</sub> score and a lower WSS95, combinations containing AB or MH are more likely to elicit good performance in the beginning but have difficulty reaching 100% recall. On the other hand, although the combination of TI, PT, and AU can reach a better overall workload saved, the recall rises slowly (low accuracy) in the beginning of the recommendation process. This inspires us to utilize multiple types of weight settings and take advantage of different article element strengths during different recommendation phases (early-, mid-, and late-phases). We plan to implement automatic detection and adjustment when information from elements has been exhausted, which indicates the time to alter the combination of elements and weight parameters. For instance, when a series of N recommended articles is classified as excluded by human reviewers, we take it as a signal for adjustment as the current setting can no longer provide a good recommendation. Another example is to first apply the combination of AB and MH, as they provide high accuracy in the early recommendation stage, and then automatically adjust to the combination of TI, PT, and AU in the subsequent phase. Further research is also necessary to investigate proper adjustments of weight parameters under different conditions.</p>
                <p>In the near future, we will also provide visualized article networks where relationships between articles could be intuitively represented and comprehended by humans. Network-based analysis will be conducted and network metrics like graph diameter, centrality, and module classes (by communication detection) will be reported. Such visualizations have the potential to enable the identification of clusters of articles and knowledge gaps in a targeted area. Lower density in such visualizations of the network could also indicate fewer related articles published or vice versa.</p>
            </sec>
            <sec>
                <title>Conclusions</title>
                <p>We demonstrated a new approach to assist the systematic review article screening process. We established article networks based on article similarity that facilitate the process of interactive article recommendation. We calculated article similarities using MEDLINE elements and examined the predictive ability of the MEDLINE element(s). We found that TI and PT have the best WSS95 performance, and AB and PT provide the best F<sub>1</sub> scores during the early stage of the recommendation process. However, no statistical difference was found.</p>
                <p>Using our approach, we are able to achieve an average of 37% WSS95 with equally weighted combination of TI, AB, and PT. The statistical analysis also demonstrated that it is competitive with existing approaches. Based on findings and lessons learned from this study, we are currently deploying the approach into a prototype public online system, ArticleNet, to assist the article screening process.</p>
            </sec>
        </sec>
    </body>
    <back>
        <glossary>
            <title>Abbreviations</title>
            <def-list>
                <def-item>
                    <term id="abb1">AB</term>
                    <def>
                        <p>abstract</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb2">ANOVA</term>
                    <def>
                        <p>analysis over variance</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb3">AU</term>
                    <def>
                        <p>author</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb4">DERP</term>
                    <def>
                        <p>Drug Effectiveness Review Project</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb5">EBM</term>
                    <def>
                        <p>evidence-based medicine</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb6">EX</term>
                    <def>
                        <p>excluded</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb7">F<sub>1</sub>
                    </term>
                    <def>
                        <p>F-measure</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb8">FCNB/WE</term>
                    <def>
                        <p>factorized complement na&#239;ve Bayes with weight engineering</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb9">IN</term>
                    <def>
                        <p>included</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb10">MH</term>
                    <def>
                        <p>MeSH, or medical subject heading</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb11">PMID</term>
                    <def>
                        <p>PubMed Indentifier</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb12">PT</term>
                    <def>
                        <p>publication type</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb13">SVM</term>
                    <def>
                        <p>support vector machine</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb14">TI</term>
                    <def>
                        <p>title</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb15">VP</term>
                    <def>
                        <p>voting perceptron-based automated citation classification system</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb16">WSS95</term>
                    <def>
                        <p>worked saved over sampling at 95% recall</p>
                    </def>
                </def-item>
            </def-list>
        </glossary>
        <ack>
            <p>Special thanks to Dr Soledad Fernandez who helped verify our statistical results. The authors also thank Dr Marian McDonagh for her suggestions for the project.</p>
        </ack>
        <fn-group>
            <fn fn-type="conflict">
                <p>None declared.</p>
            </fn>
        </fn-group>
        <ref-list>
            <ref id="ref1">
                <label>1</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Yuan</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hunt</surname>
                            <given-names>RH</given-names>
                        </name>
                    </person-group>
                    <article-title>Systematic reviews: the good, the bad, and the ugly</article-title>
                    <source>Am J Gastroenterol</source>
                    <year>2009</year>
                    <month>05</month>
                    <volume>104</volume>
                    <issue>5</issue>
                    <fpage>1086</fpage>
                    <lpage>1092</lpage>
                    <pub-id pub-id-type="doi">10.1038/ajg.2009.118</pub-id>
                    <pub-id pub-id-type="medline">19417748</pub-id>
                    <pub-id pub-id-type="pii">ajg2009118</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Akobeng</surname>
                            <given-names>AK</given-names>
                        </name>
                    </person-group>
                    <article-title>Understanding systematic reviews and meta-analysis</article-title>
                    <source>Arch Dis Child</source>
                    <year>2005</year>
                    <month>08</month>
                    <volume>90</volume>
                    <issue>8</issue>
                    <fpage>845</fpage>
                    <lpage>848</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://adc.bmj.com/cgi/pmidlookup?view=long&#38;pmid=16040886" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1136/adc.2004.058230</pub-id>
                    <pub-id pub-id-type="medline">16040886</pub-id>
                    <pub-id pub-id-type="pii">90/8/845</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1720526</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mulrow</surname>
                            <given-names>CD</given-names>
                        </name>
                    </person-group>
                    <article-title>Rationale for systematic reviews</article-title>
                    <source>BMJ</source>
                    <year>1994</year>
                    <month>09</month>
                    <day>3</day>
                    <volume>309</volume>
                    <issue>6954</issue>
                    <fpage>597</fpage>
                    <lpage>599</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/8086953" />
                    </comment>
                    <pub-id pub-id-type="medline">8086953</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2541393</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Manchikanti</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Evidence-based medicine, systematic reviews, and guidelines in interventional pain management, part I: introduction and general considerations</article-title>
                    <source>Pain Physician</source>
                    <year>2008</year>
                    <volume>11</volume>
                    <issue>2</issue>
                    <fpage>161</fpage>
                    <lpage>186</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.painphysicianjournal.com/linkout_vw.php?issn=1533-3159&#38;vol=11&#38;page=161" />
                    </comment>
                    <pub-id pub-id-type="medline">18354710</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lavis</surname>
                            <given-names>JN</given-names>
                        </name>
                    </person-group>
                    <article-title>How can we support the use of systematic reviews in policymaking?</article-title>
                    <source>PLoS Med</source>
                    <year>2009</year>
                    <month>11</month>
                    <volume>6</volume>
                    <issue>11</issue>
                    <fpage>e1000141</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pmed.1000141" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1371/journal.pmed.1000141</pub-id>
                    <pub-id pub-id-type="medline">19936223</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2777391</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Phillips</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ball</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sackett</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <source>Oxford Centre for Evidence-Based Medicine (CEBM)</source>
                    <year>2009</year>
                    <access-date>2012-09-10</access-date>
                    <comment>Oxford Centre for Evidence-Based Medicine: Levels of Evidence<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.cebm.net/index.aspx?o=1025">http://www.cebm.net/index.aspx?o=1025</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6AZnaE7iG</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Cohen</surname>
                            <given-names>AM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hersh</surname>
                            <given-names>WR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Peterson</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Yen</surname>
                            <given-names>PY</given-names>
                        </name>
                    </person-group>
                    <article-title>Reducing workload in systematic review preparation using automated citation classification</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2006</year>
                    <volume>13</volume>
                    <issue>2</issue>
                    <fpage>206</fpage>
                    <lpage>219</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=16357352" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1197/jamia.M1929</pub-id>
                    <pub-id pub-id-type="medline">16357352</pub-id>
                    <pub-id pub-id-type="pii">M1929</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1447545</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Glasziou</surname>
                            <given-names>PP</given-names>
                        </name>
                    </person-group>
                    <article-title>Information overload: what's behind it, what's beyond it?</article-title>
                    <source>Med J Aust</source>
                    <year>2008</year>
                    <month>07</month>
                    <day>21</day>
                    <volume>189</volume>
                    <issue>2</issue>
                    <fpage>84</fpage>
                    <lpage>85</lpage>
                    <pub-id pub-id-type="medline">18637773</pub-id>
                    <pub-id pub-id-type="pii">gla10552_fm</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Clarke</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>The Cochrane Collaboration and the Cochrane Library</article-title>
                    <source>Otolaryngol Head Neck Surg</source>
                    <year>2007</year>
                    <month>10</month>
                    <volume>137</volume>
                    <issue>4 Suppl</issue>
                    <fpage>S52</fpage>
                    <lpage>54</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.otohns.2007.05.050</pub-id>
                    <pub-id pub-id-type="medline">17894947</pub-id>
                    <pub-id pub-id-type="pii">S0194-5998(07)00526-8</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Shojania</surname>
                            <given-names>KG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sampson</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ansari</surname>
                            <given-names>MT</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ji</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Doucette</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Moher</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <article-title>How quickly do systematic reviews go out of date? A survival analysis</article-title>
                    <source>Ann Intern Med</source>
                    <year>2007</year>
                    <month>08</month>
                    <day>21</day>
                    <volume>147</volume>
                    <issue>4</issue>
                    <fpage>224</fpage>
                    <lpage>233</lpage>
                    <pub-id pub-id-type="medline">17638714</pub-id>
                    <pub-id pub-id-type="pii">0000605-200708210-00179</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Tsafnat</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Glasziou</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Choong</surname>
                            <given-names>MK</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dunn</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Galgani</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Coiera</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>Systematic review automation technologies</article-title>
                    <source>Syst Rev</source>
                    <year>2014</year>
                    <volume>3</volume>
                    <fpage>74</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.systematicreviewsjournal.com/content/3//74" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1186/2046-4053-3-74</pub-id>
                    <pub-id pub-id-type="medline">25005128</pub-id>
                    <pub-id pub-id-type="pii">2046-4053-3-74</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4100748</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Cohen</surname>
                            <given-names>AM</given-names>
                        </name>
                    </person-group>
                    <article-title>Optimizing feature representation for automated systematic review work prioritization</article-title>
                    <year>2008</year>
                    <conf-name>Annual Symposium Proceedings/AMIA Symposium</conf-name>
                    <conf-date>2008</conf-date>
                    <conf-loc>Washington, DC</conf-loc>
                    <fpage>121</fpage>
                    <lpage>125</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wallace</surname>
                            <given-names>BC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Trikalinos</surname>
                            <given-names>TA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lau</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brodley</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schmid</surname>
                            <given-names>CH</given-names>
                        </name>
                    </person-group>
                    <article-title>Semi-automated screening of biomedical citations for systematic reviews</article-title>
                    <source>BMC Bioinformatics</source>
                    <year>2010</year>
                    <volume>11</volume>
                    <fpage>55</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.biomedcentral.com/1471-2105/11/55" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1186/1471-2105-11-55</pub-id>
                    <pub-id pub-id-type="medline">20102628</pub-id>
                    <pub-id pub-id-type="pii">1471-2105-11-55</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2824679</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref14">
                <label>14</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wallace</surname>
                            <given-names>BC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Small</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brodley</surname>
                            <given-names>CE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lau</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Trikalinos</surname>
                            <given-names>TA</given-names>
                        </name>
                    </person-group>
                    <article-title>Deploying an interactive machine learning system in an evidence-based practice center: abstract</article-title>
                    <year>2012</year>
                    <conf-name>2nd ACM SIGHIT International Health Informatics Symposium</conf-name>
                    <conf-date>2012</conf-date>
                    <conf-loc>Miami, Florida</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref15">
                <label>15</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Matwin</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kouznetsov</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Inkpen</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Frunza</surname>
                            <given-names>O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>O'Blenis</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>A new algorithm for reducing the workload of experts in performing systematic reviews</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2010</year>
                    <volume>17</volume>
                    <issue>4</issue>
                    <fpage>446</fpage>
                    <lpage>453</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=20595313" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1136/jamia.2010.004325</pub-id>
                    <pub-id pub-id-type="medline">20595313</pub-id>
                    <pub-id pub-id-type="pii">17/4/446</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2995653</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref16">
                <label>16</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Salton</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Buckley</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <person-group person-group-type="editor">
                        <name name-style="western">
                            <surname>Jones</surname>
                            <given-names>KS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Willett</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>Improving retrieval performance by relevance feedback</article-title>
                    <source>Readings in Information Retrieval</source>
                    <year>1997</year>
                    <publisher-loc>Burlington, MA</publisher-loc>
                    <publisher-name>Morgan Kaufmann Publishers Inc</publisher-name>
                    <fpage>355</fpage>
                    <lpage>364</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref17">
                <label>17</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ruthven</surname>
                            <given-names>I</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lalmas</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>A survey on the use of relevance feedback for information access systems</article-title>
                    <source>Knowl Eng Rev</source>
                    <year>2003</year>
                    <volume>18</volume>
                    <issue>2</issue>
                    <fpage>95</fpage>
                    <lpage>145</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref18">
                <label>18</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Garfield</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pudovkin</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Istomin</surname>
                            <given-names>V</given-names>
                        </name>
                    </person-group>
                    <article-title>Algorithmic citation‐linked historiography: Mapping the literature of science</article-title>
                    <source>Proceedings of the American Society for Information Science and Technology</source>
                    <year>2002</year>
                    <conf-name>ASIS&#38;T</conf-name>
                    <conf-date>2002</conf-date>
                    <conf-loc>Philadelphia, PA</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref19">
                <label>19</label>
                <nlm-citation citation-type="web">
                    <source>MEDLINE/PubMed Data Element (Field) Descriptions</source>
                    <access-date>2014-03-08</access-date>
                    <publisher-name>NIH US National Library of Medicine</publisher-name>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.nlm.nih.gov/bsd/mms/medlineelements.html">http://www.nlm.nih.gov/bsd/mms/medlineelements.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6axCSptUP</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref20">
                <label>20</label>
                <nlm-citation citation-type="web">
                    <source>OHSU Center for Evidence-Based Policy</source>
                    <access-date>2015-08-21</access-date>
                    <comment>Drug Effectiveness Review Project (DERP) Systematic Drug Class Review Gold Standard Data <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://skynet.ohsu.edu/~cohenaa/systematic-drug-class-review-data.html ">http://skynet.ohsu.edu/~cohenaa/systematic-drug-class-review-data.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6axCmYzFa</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref21">
                <label>21</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kim</surname>
                            <given-names>Seunghee</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Choi</surname>
                            <given-names>Jinwook</given-names>
                        </name>
                    </person-group>
                    <article-title>Improving the performance of text categorization models used for the selection of high quality articles</article-title>
                    <source>Healthc Inform Res</source>
                    <year>2012</year>
                    <month>03</month>
                    <volume>18</volume>
                    <issue>1</issue>
                    <fpage>18</fpage>
                    <lpage>28</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.e-hir.org/journal/viewJournal.html?year=2012&#38;vol=018&#38;num=01&#38;page=18" />
                    </comment>
                    <pub-id pub-id-type="doi">10.4258/hir.2012.18.1.18</pub-id>
                    <pub-id pub-id-type="medline">22509470</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3324751</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref22">
                <label>22</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Tan</surname>
                            <given-names>P-N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Steinbach</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kumar</surname>
                            <given-names>V</given-names>
                        </name>
                    </person-group>
                    <source>Introduction to Data Mining</source>
                    <year>2006</year>
                    <publisher-loc>Boston, MA</publisher-loc>
                    <publisher-name>Pearson Addison Wesley</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref23">
                <label>23</label>
                <nlm-citation citation-type="web">
                    <source>PubMed Help</source>
                    <access-date>2015-08-21</access-date>
                    <comment>PubMed Stopword List<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.ncbi.nlm.nih.gov/books/NBK3827/">http://www.ncbi.nlm.nih.gov/books/NBK3827/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6axDPDpEt</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref24">
                <label>24</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Porter</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>An algorithm for suffix stripping</article-title>
                    <source>Program</source>
                    <year>1980</year>
                    <volume>14</volume>
                    <issue>3</issue>
                    <fpage>130</fpage>
                    <lpage>137</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref25">
                <label>25</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bekhuis</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tseytlin</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mitchell</surname>
                            <given-names>KJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Demner-Fushman</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <article-title>Feature engineering and a proposed decision-support system for systematic reviewers of medical evidence</article-title>
                    <source>PLoS One</source>
                    <year>2014</year>
                    <volume>9</volume>
                    <issue>1</issue>
                    <fpage>e86277</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0086277" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0086277</pub-id>
                    <pub-id pub-id-type="medline">24475099</pub-id>
                    <pub-id pub-id-type="pii">PONE-D-13-31264</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3903545</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref26">
                <label>26</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wright</surname>
                            <given-names>SP</given-names>
                        </name>
                    </person-group>
                    <article-title>Adjusted P-values for simultaneous inference</article-title>
                    <source>Biometrics</source>
                    <year>1992</year>
                    <volume>48</volume>
                    <issue>4</issue>
                    <fpage>1005</fpage>
                    <lpage>1013</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref27">
                <label>27</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Blakesley</surname>
                            <given-names>RE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mazumdar</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dew</surname>
                            <given-names>MA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Houck</surname>
                            <given-names>PR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tang</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Reynolds</surname>
                            <given-names>CF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Butters</surname>
                            <given-names>MA</given-names>
                        </name>
                    </person-group>
                    <article-title>Comparisons of methods for multiple hypothesis testing in neuropsychological research</article-title>
                    <source>Neuropsychology</source>
                    <year>2009</year>
                    <month>03</month>
                    <volume>23</volume>
                    <issue>2</issue>
                    <fpage>255</fpage>
                    <lpage>264</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/19254098" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1037/a0012850</pub-id>
                    <pub-id pub-id-type="medline">19254098</pub-id>
                    <pub-id pub-id-type="pii">2009-02621-013</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3045855</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref28">
                <label>28</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bekhuis</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Demner-Fushman</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <article-title>Towards automating the initial screening phase of a systematic review</article-title>
                    <source>Stud Health Technol Inform</source>
                    <year>2010</year>
                    <volume>160</volume>
                    <issue>Pt 1</issue>
                    <fpage>146</fpage>
                    <lpage>150</lpage>
                    <pub-id pub-id-type="medline">20841667</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref29">
                <label>29</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kastrin</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Peterlin</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hristovski</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <article-title>Chi-square-based scoring function for categorization of MEDLINE citations</article-title>
                    <source>Methods Inf Med</source>
                    <year>2010</year>
                    <volume>49</volume>
                    <issue>4</issue>
                    <fpage>371</fpage>
                    <lpage>378</lpage>
                    <pub-id pub-id-type="doi">10.3414/ME09-01-0009</pub-id>
                    <pub-id pub-id-type="medline">20091016</pub-id>
                    <pub-id pub-id-type="pii">09-01-0009</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref30">
                <label>30</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Frunza</surname>
                            <given-names>O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Inkpen</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Matwin</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>Building systematic reviews using automatic text classification techniques</article-title>
                    <year>2010</year>
                    <conf-name>Paper presented at: Proceedings of the 23rd International Conference on Computational Linguistics: Posters</conf-name>
                    <conf-date>2010</conf-date>
                    <conf-loc>Beijing, China</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref31">
                <label>31</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Shemilt</surname>
                            <given-names>I</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Simon</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hollands</surname>
                            <given-names>GJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Marteau</surname>
                            <given-names>TM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ogilvie</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>O'Mara-Eves</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kelly</surname>
                            <given-names>MP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Thomas</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Pinpointing needles in giant haystacks: use of text mining to reduce impractical screening workload in extremely large scoping reviews</article-title>
                    <source>Res Synth Methods</source>
                    <year>2014</year>
                    <month>03</month>
                    <volume>5</volume>
                    <issue>1</issue>
                    <fpage>31</fpage>
                    <lpage>49</lpage>
                    <pub-id pub-id-type="doi">10.1002/jrsm.1093</pub-id>
                    <pub-id pub-id-type="medline">26054024</pub-id>
                </nlm-citation>
            </ref>
        </ref-list>
    </back>
</article>