<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i9e30401</article-id>
      <article-id pub-id-type="pmid">34499041</article-id>
      <article-id pub-id-type="doi">10.2196/30401</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Review</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Review</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Machine Learning Approaches to Retrieve High-Quality, Clinically Relevant Evidence From the Biomedical Literature: Systematic Review</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Lovis</surname>
            <given-names>Christian</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Kalicoglu</surname>
            <given-names>Halil</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Afzal</surname>
            <given-names>Muhammad</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Abdelkader</surname>
            <given-names>Wael</given-names>
          </name>
          <degrees>MD, MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Health Information Research Unit</institution>
            <institution>Department of Health Research Methods, Evidence, and Impact</institution>
            <institution>McMaster University</institution>
            <addr-line>1280 Main St W</addr-line>
            <addr-line>CRL Building, First Floor</addr-line>
            <addr-line>Hamilton, ON, L8S 4K1</addr-line>
            <country>Canada</country>
            <phone>1 647 563 5732</phone>
            <email>Abdelkaw@mcmaster.ca</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9581-1521</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Navarro</surname>
            <given-names>Tamara</given-names>
          </name>
          <degrees>MLiS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2810-6942</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Parrish</surname>
            <given-names>Rick</given-names>
          </name>
          <degrees>DiplT</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3809-6015</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Cotoi</surname>
            <given-names>Chris</given-names>
          </name>
          <degrees>BEng, EMBA</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7029-0582</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Germini</surname>
            <given-names>Federico</given-names>
          </name>
          <degrees>MD, MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0802-3616</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Iorio</surname>
            <given-names>Alfonso</given-names>
          </name>
          <degrees>MD, PhD, FRCPC</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3331-8766</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Haynes</surname>
            <given-names>R Brian</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1453-3196</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Lokker</surname>
            <given-names>Cynthia</given-names>
          </name>
          <degrees>MSc, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2436-4290</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Health Information Research Unit</institution>
        <institution>Department of Health Research Methods, Evidence, and Impact</institution>
        <institution>McMaster University</institution>
        <addr-line>Hamilton, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Medicine</institution>
        <institution>McMaster University</institution>
        <addr-line>Hamilton, ON</addr-line>
        <country>Canada</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Wael Abdelkader <email>Abdelkaw@mcmaster.ca</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>9</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>9</day>
        <month>9</month>
        <year>2021</year>
      </pub-date>
      <volume>9</volume>
      <issue>9</issue>
      <elocation-id>e30401</elocation-id>
      <history>
        <date date-type="received">
          <day>13</day>
          <month>5</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>2</day>
          <month>7</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>15</day>
          <month>7</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>25</day>
          <month>7</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Wael Abdelkader, Tamara Navarro, Rick Parrish, Chris Cotoi, Federico Germini, Alfonso Iorio, R Brian Haynes, Cynthia Lokker. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 09.09.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2021/9/e30401" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The rapid growth of the biomedical literature makes identifying strong evidence a time-consuming task. Applying machine learning to the process could be a viable solution that limits effort while maintaining accuracy.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The goal of the research was to summarize the nature and comparative performance of machine learning approaches that have been applied to retrieve high-quality evidence for clinical consideration from the biomedical literature.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We conducted a systematic review of studies that applied machine learning techniques to identify high-quality clinical articles in the biomedical literature. Multiple databases were searched to July 2020. Extracted data focused on the applied machine learning model, steps in the development of the models, and model performance.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>From 3918 retrieved studies, 10 met our inclusion criteria. All followed a supervised machine learning approach and applied, from a limited range of options, a high-quality standard for the training of their model. The results show that machine learning can achieve a sensitivity of 95% while maintaining a high precision of 86%.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Machine learning approaches perform well in retrieving high-quality clinical studies. Performance may improve by applying more sophisticated approaches such as active learning and unsupervised machine learning approaches.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>machine learning</kwd>
        <kwd>bioinformatics</kwd>
        <kwd>information retrieval</kwd>
        <kwd>evidence-based medicine</kwd>
        <kwd>literature databases</kwd>
        <kwd>systematic review</kwd>
        <kwd>accuracy</kwd>
        <kwd>medical literature</kwd>
        <kwd>clinical support</kwd>
        <kwd>clinical care</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background and Significance</title>
        <p>Evidence-based medicine (EBM) is identified by three key elements: the best available clinical evidence, clinician expertise, and application of the evidence with consideration of patients’ circumstances, values, and preferences [<xref ref-type="bibr" rid="ref1">1</xref>]. EBM complements or reduces reliance on expert opinion with a coherent and structured framework for assessing and applying the best evidence to patient care decisions [<xref ref-type="bibr" rid="ref2">2</xref>]. An obvious and worsening barrier to the implementation of EBM is the continuously growing body of medical literature. According to the National Library of Medicine, over 900,000 new citations were indexed in MEDLINE in 2020, very few of which were relevant to or ready for clinical attention [<xref ref-type="bibr" rid="ref3">3</xref>]. Searching for the best clinical care evidence is a challenging task for researchers and clinicians, and facilitation of the search process is a necessity [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
      </sec>
      <sec>
        <title>Search Filters</title>
        <p>Search filters, also referred to as hedges, allow researchers, clinicians, and librarians to retrieve evidence from bibliographic databases and journals by filtering searches to return reliable and specific articles to address clinical questions, produce systematic reviews, or inform clinical guidelines [<xref ref-type="bibr" rid="ref5">5</xref>]. MEDLINE search filters, for example, enable researchers to combine the use of free text with controlled vocabularies like Medical Subject Heading (MeSH) terms and other indexing features to improve search results targeting the clinical question at hand [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. There are search filters that focus on the purpose of a study and its methods or topical content areas [<xref ref-type="bibr" rid="ref8">8</xref>]. Topical search filters help identify articles based on particular clinical conditions using terms related to that condition [<xref ref-type="bibr" rid="ref8">8</xref>], while methodological search filters comprise terms that identify articles based on their research purpose [<xref ref-type="bibr" rid="ref9">9</xref>]. For example, the Hedges project, developed by the Health Information Research Unit at McMaster University, provides search filters for MEDLINE, PsycINFO, and EMBASE using the OVID syntax for a range of purpose categories of articles such as treatment, diagnosis, and prognosis and include methodological terms [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. For searches seeking articles on a treatment (purpose), the search hedge includes methodological terms related to clinical or randomized controlled trials (RCTs), while the diagnosis search hedge includes methodological terms including sensitivity and specificity [<xref ref-type="bibr" rid="ref12">12</xref>].</p>
        <p>These search filters were developed to identify high-quality studies based on established critical appraisal criteria for methodological rigor [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref15">15</xref>]. This was done by annotating articles as meeting or not meeting criteria and using the annotated dataset to evaluate the performance of search terms to optimally retrieve the high-quality studies. For RCTs, applying the Cochrane risk for bias tool includes assessing randomization method, allocation concealment, follow-up data for at least 80% of participants, blinding of participants, and outcome assessors [<xref ref-type="bibr" rid="ref14">14</xref>]. For the Hedges project, the criteria applied to articles by purpose are available online [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
        <p>Clinical search filters are intended to help clinicians, researchers, and policymakers quickly access relevant studies and systematic reviews in a way that can be tailored to the user’s demand [<xref ref-type="bibr" rid="ref8">8</xref>]. The filters differ in their sensitivity and specificity according to the terms used, databases searched, and precision of the filter [<xref ref-type="bibr" rid="ref16">16</xref>]. Some filters offer high specificity, which limits the proportion of off-target articles that are retrieved. This is useful for busy clinicians who value the most efficient use of their time in finding relevant evidence quickly. Search filters may also have the option to maximize sensitivity and identify all potentially relevant articles at the cost of including a higher proportion of off-target articles [<xref ref-type="bibr" rid="ref17">17</xref>], an approach more suited to the conduct of systematic literature reviews.</p>
        <p>Although search filters, such as Clinical Queries in PubMed, have been used since 1990 and have continued to work well over the years [<xref ref-type="bibr" rid="ref18">18</xref>], they have some limitations. One limitation is their partial dependence on MeSH indexing terms, as the process of indexing of articles within MEDLINE can take up to a year for some articles [<xref ref-type="bibr" rid="ref19">19</xref>]. For diagnostic studies, there is large variability in designs and methods, which may result in largely incomplete literature searches [<xref ref-type="bibr" rid="ref7">7</xref>]. When applied in the context of conducting a systematic review, the highly specific filters result in missing evidence [<xref ref-type="bibr" rid="ref7">7</xref>], and the high sensitivity search filters will only partially reduce the time-consuming task of screening retrieved titles and abstracts [<xref ref-type="bibr" rid="ref20">20</xref>].</p>
      </sec>
      <sec>
        <title>Overview of Machine Learning Applied for Text Processing</title>
        <p>Machine learning is a subset of artificial intelligence that refers to a series of computational methods using experience to improve performance or achieve accurate and precise predictions. Experience, in this context, refers to the information made available to the machine for the analysis [<xref ref-type="bibr" rid="ref21">21</xref>]. A more detailed definition was provided by Mitchell [<xref ref-type="bibr" rid="ref22">22</xref>]: “A computer program is said to learn from experience (E) with respect to some class of tasks (T) and performance measure (P), if its performance at tasks in T, as measured by P, improves with experience E.”</p>
        <p>Machine learning applications have become increasingly popular and essential in health care [<xref ref-type="bibr" rid="ref23">23</xref>], as the system generates an enormous amount of data every day [<xref ref-type="bibr" rid="ref24">24</xref>]. Machine learning can identify relevant relations in large health care–generated datasets and derive algorithms that generate accurate predictions [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. For example, machine learning has been used to predict the risk for nosocomial infection by leveraging data from electronic health records [<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref29">29</xref>]. A machine learning classifier is a mathematical procedure responsible for identifying the patterns and performing the prediction task on the dataset, while a machine learning model is the output of the algorithm [<xref ref-type="bibr" rid="ref30">30</xref>]. A machine learning model represents the complete learning process including the training of the algorithm and the used set of features [<xref ref-type="bibr" rid="ref30">30</xref>].</p>
        <p>Another application of machine learning in the health care and biomedical literature is text mining, which refers to the discovery of previously unknown information from unstructured textual data [<xref ref-type="bibr" rid="ref31">31</xref>]. This is done by converting the text to structured analyzable data using natural language processing (NLP) [<xref ref-type="bibr" rid="ref32">32</xref>]. With the exponential increase in the amount of information available for clinicians and researchers, both in biomedical literature and electronic health records [<xref ref-type="bibr" rid="ref33">33</xref>], text mining has been applied for text summarization [<xref ref-type="bibr" rid="ref34">34</xref>], literature retrieval [<xref ref-type="bibr" rid="ref35">35</xref>], and evidence grading [<xref ref-type="bibr" rid="ref36">36</xref>]. Machine learning has also been applied to automate the screening process for systematic reviews, identifying relevant articles while decreasing workload and increasing efficiency [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. Semantic analysis, the process of understanding text by interpreting meanings from the unstructured text [<xref ref-type="bibr" rid="ref39">39</xref>], has been applied to information extraction from the biomedical literature [<xref ref-type="bibr" rid="ref40">40</xref>].</p>
        <p>There are several types of machine learning determined by their mathematical approach [<xref ref-type="bibr" rid="ref41">41</xref>]. The basic machine learning strategies are supervised learning, unsupervised learning, and reinforced learning [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>]. Supervised learning relies on a prelabeled training dataset to provide the machine with the necessary input to make accurate predictions [<xref ref-type="bibr" rid="ref41">41</xref>]. Decision tree (DT), naïve Bayes (NB), and support vector machine (SVM) are common supervised machine learning algorithms [<xref ref-type="bibr" rid="ref43">43</xref>]. Unsupervised learning does not use labeled data and is mainly used for structuring and organizing data rather than classification [<xref ref-type="bibr" rid="ref43">43</xref>]. In reinforced learning, the algorithm learns by reacting to its environment and reaches predictions via a reward system [<xref ref-type="bibr" rid="ref42">42</xref>]. A common machine learning technique is ensemble learning, which combines more than one classifier to perform an individual prediction task. Boosting is one of the commonly used ensemble learners, which combines multiple weak classifiers and converts them into one strong classifier [<xref ref-type="bibr" rid="ref41">41</xref>]. Neural networks are multilayer mathematical structures consisting of an input layer, an output layer, and a hidden layer (commonly more than one layer) in between [<xref ref-type="bibr" rid="ref44">44</xref>]. In each layer a series of calculations occurs, leading to better performance [<xref ref-type="bibr" rid="ref44">44</xref>]. Due to the multilayer nature of neural networks, their field of study is known as deep learning. Neural networks can be supervised, unsupervised, or reinforced [<xref ref-type="bibr" rid="ref45">45</xref>].</p>
        <p>Another appealing application of machine learning approaches to the biomedical literature is to improve retrieval of clinically relevant articles, building on and hopefully overcoming the limitation faced by Boolean searching. Several studies have been conducted to assess the performance of machine learning classifiers to identify specific categories of published articles. For example, Marshall and colleagues [<xref ref-type="bibr" rid="ref46">46</xref>] applied machine learning to identify RCTs. Del Fiol and colleagues [<xref ref-type="bibr" rid="ref35">35</xref>] used machine learning to extract only scientifically sound treatment studies from PubMed. However, no systematic review of studies objectively assessing the performance of such machine learning models, ideally comparing their performance to traditional evidence retrieval methods such as validated Boolean search filters or manual critical appraisal by experts in the field, has been performed to date. Such a systematic review would be of critical value in driving future machine learning research aimed at improving the delivery of relevant evidence to the point of care.</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>The objective of this systematic review is to summarize the nature (methods and approaches) and comparative performance (eg, recall and precision) of machine learning approaches that have been applied to retrieve high-quality evidence for clinical consideration from the biomedical literature. High-quality is defined as articles that meet established methodological critical appraisal criteria, with annotated datasets that apply these criteria considered the gold standard.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <p>The following subsections describe in detail the steps that were conducted to identify, screen, and abstract data from the included studies.</p>
      <sec>
        <title>Search Strategies</title>
        <p>Nine databases were searched from inception to July 8, 2020, to identify relevant articles: Web of Science (title, abstract); MEDLINE; Embase; PsychINFO (title, abstract, keyword, subject terms); Wiley Online Library; ScienceDirect (title, abstract, keyword); CINAHL; IEEE (title, abstract, keywords), and Association of Computer Machinery digital library (title, abstract). The Multidisciplinary Digital Publishing Institute (title, abstract) database was searched on November 17, 2020. The search strategy was developed with a librarian (TN). Search terms related to 4 concepts—machine learning, literature retrieval, high research quality, and biomedical literature—were combined using the AND Boolean operator. The OVID MEDLINE search included the following terms, which were translated for the other databases (mp = multipurpose, searching within the title, original title, abstract, subject heading, name of substance, and registry word fields):</p>
        <list list-type="bullet">
          <list-item>
            <p>Machine learning: (neural networks/ or machine learning/ or natural language processing/ or data mining/ or support vector machine/ or (“text categorization” or “text classification” or “text analysis” or “literature mining” or “text mining”).mp)</p>
          </list-item>
          <list-item>
            <p>Study objective or goal: (“Abstracting and Indexing”/ or “information storage and retrieval”/ or (“article retrieval” or “literature surveillance” or “literature screening” or “article screening” or “evidence search” or “evidence screening” or “evidence review” or “information retrieval” or “literature survey” or “document classification” or “review efficiency” or “citation screening” or “literature databases”).mp.)</p>
          </list-item>
          <list-item>
            <p>High-quality: (“Sensitivity and Specificity”/ or evidence-based medicine/ or (“quality” or “evidence” or “high-quality” or “clinical trial” or “random*” or “randomized controlled trial” or “sensitivity or specificity” or “accuracy” or “precision”).mp.)</p>
          </list-item>
        </list>
        <p>In the Association of Computer Machinery digital library and Multidisciplinary Digital Publishing Institute search queries, terms related to the biomedical literature were included: (“PubMed” or “MEDLINE” or “medical literature” or “Biomedical literature”).</p>
      </sec>
      <sec>
        <title>Study Selection</title>
        <p>Articles retrieved by our search queries were collected in a single Research Information Systems file using JabRef software. Deduplication was conducted using both JabRef automatic deduping and Covidence automatic deduplication. We included articles that met the following criteria:</p>
        <list list-type="bullet">
          <list-item>
            <p>Reported on the use of a machine learning approach for the retrieval of single studies or systematic reviews concerning the management of health care problems in large biomedical bibliographic databases such as MEDLINE and EMBASE</p>
          </list-item>
          <list-item>
            <p>Classified retrieved articles based on quality (using a gold standard)</p>
          </list-item>
          <list-item>
            <p>Used a textual analysis machine learning approach</p>
          </list-item>
          <list-item>
            <p>Evaluated the performance of the machine learning approach (ie, they present a comparison of retrieval methods or other ways of appraising the performance of the machine learning approach)</p>
          </list-item>
          <list-item>
            <p>Conducted within the biomedical literature domain</p>
          </list-item>
          <list-item>
            <p>Published in the English language</p>
          </list-item>
        </list>
      </sec>
      <sec>
        <title>Abstract and Full-Text Screening</title>
        <p>Titles and abstracts of all the retrieved articles were screened independently in Covidence.org by two members of the study team. Articles were assessed as relevant, irrelevant, or maybe relevant. The full texts of relevant and maybe relevant articles were then reviewed in duplicate, with conflicts adjudicated by a third team member.</p>
      </sec>
      <sec>
        <title>Data Extraction</title>
        <p>A data extraction spreadsheet was developed to gather data regarding the methods of the machine learning approaches as detailed by the survey by Agarwal and Mittal [<xref ref-type="bibr" rid="ref47">47</xref>] and included details on preprocessing steps, text representation, feature selection, feature extraction, and classifiers used. Additionally, we extracted data specific to the retrieval of high-quality articles such as the quality gold standard, the comparators used to test the machine learning models, and the performance of the developed algorithms.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Study Selection</title>
        <p>Our search queries retrieved 3918 articles after 472 duplicates were removed; 3632 were excluded during the title and abstract screening for not applying a machine learning approach to biomedical articles. A total of 286 were selected for full-text screening, and 10 articles met our eligibility criteria (<xref rid="figure1" ref-type="fig">Figure 1</xref>) [<xref ref-type="bibr" rid="ref48">48</xref>]. Due to the heterogeneity in the population (retrieved articles), index method (machine learning algorithm used), gold standard, and outcomes (definition of high-quality study), we did not perform a quantitative synthesis of the results.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>PRISMA flow diagram of the studies identification process for the systematic review [<xref ref-type="bibr" rid="ref48">48</xref>].</p>
          </caption>
          <graphic xlink:href="medinform_v9i9e30401_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Quality Gold Standard</title>
        <p>Each study used a quality gold standard database of original studies or systematic reviews that were manually reviewed and annotated by experts based on their scientific soundness and clinical relevance (<xref ref-type="table" rid="table1">Table 1</xref>). Datasets of articles that met or did not meet standards for quality and relevance were used to train the machine learning models. Four studies used the American College of Physicians (ACP) Journal Club as their quality gold standard [<xref ref-type="bibr" rid="ref49">49</xref>-<xref ref-type="bibr" rid="ref52">52</xref>], 3 studies used the Clinical Hedges dataset [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref53">53</xref>], 2 studies considered articles that were included in treatment clinical guidelines as high quality [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>], and 1 article used the Cochrane Library as their gold standard [<xref ref-type="bibr" rid="ref56">56</xref>].</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>The quality standard used as the training dataset for developing the classifiers in the included studies.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="330"/>
            <col width="670"/>
            <thead>
              <tr valign="top">
                <td>Author</td>
                <td>Quality gold standard</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                <td>ACP<sup>a</sup> Journal Club (treatment class)<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                <td>ACP Journal Club (treatment, diagnosis, etiology, prognosis)<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref51">51</xref>]</td>
                <td>ACP Journal Club (treatment, diagnosis, etiology, prognosis)<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>Clinical Hedges<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Lin et al [<xref ref-type="bibr" rid="ref52">52</xref>]</td>
                <td>ACP Journal Club (unspecified classes of articles)<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Afzal et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>Clinical Hedges<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Bian et al [<xref ref-type="bibr" rid="ref54">54</xref>]</td>
                <td>Articles cited in 11 clinical guidelines on the treatment of cardiac, autoimmune, and respiratory diseases</td>
              </tr>
              <tr valign="top">
                <td>Del Fiol et al [<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                <td>Clinical Hedges<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Bian et al [<xref ref-type="bibr" rid="ref55">55</xref>]</td>
                <td>Articles cited in 11 clinical guidelines on the treatment of cardiac, autoimmune, and respiratory diseases</td>
              </tr>
              <tr valign="top">
                <td>Afzal et al [<xref ref-type="bibr" rid="ref56">56</xref>]</td>
                <td>Cochrane Library Reviews</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>ACP: American College of Physicians.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>Hand searches of articles from approximately 125 clinical journals that were assessed by critical appraisal criteria; articles meeting criteria were then judged by clinicians for clinical relevance. ACP Journal Club includes additional reviews by clinicians.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Preprocessing Methods</title>
        <p>A matrix of the preprocessing steps that were applied to the dataset before developing the classifiers as reported in the included studies is presented in <xref ref-type="table" rid="table2">Table 2</xref>. Seven of the included studies provided details of their preprocessing steps [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref49">49</xref>-<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref56">56</xref>], which included the conversion of text to lowercase, word-stemming, and removal of stop words. Additionally, 6 studies applied a term weighting method [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref49">49</xref>-<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref56">56</xref>] to express the importance of a word in each document based on its frequency. Afzal et al [<xref ref-type="bibr" rid="ref36">36</xref>] used vocabulary pruning by removing off topic-specific frequent terms and rarely occurring terms. Three studies did not specify the steps for their preprocessing steps [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>].</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Preprocessing steps applied to article data for preparing the datasets for machine learning algorithm development.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="190"/>
            <col width="130"/>
            <col width="140"/>
            <col width="100"/>
            <col width="130"/>
            <col width="150"/>
            <col width="160"/>
            <thead>
              <tr valign="top">
                <td>Author</td>
                <td>Text converted to lowercase</td>
                <td>Removal of punctuation</td>
                <td>Removal of stop words</td>
                <td>Porter- stemming</td>
                <td>Weighting method</td>
                <td>Unique preprocessing considered</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                <td>✓<sup>a</sup></td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>Log frequency with redundancy</td>
                <td>NR<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>Log frequency with redundancy</td>
                <td>NR</td>
              </tr>
              <tr valign="top">
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref51">51</xref>]</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>Log frequency with redundancy</td>
                <td>Removed infrequent words</td>
              </tr>
              <tr valign="top">
                <td>Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>✓</td>
                <td>NR</td>
                <td>✓</td>
                <td>✓</td>
                <td>Information gain measure</td>
                <td>Removed infrequent words</td>
              </tr>
              <tr valign="top">
                <td>Lin et al [<xref ref-type="bibr" rid="ref52">52</xref>]</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
              </tr>
              <tr valign="top">
                <td>Afzal et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>✓</td>
                <td>NR</td>
                <td>✓</td>
                <td>✓</td>
                <td>TF-IDF<sup>c</sup></td>
                <td>Vocabulary pruning</td>
              </tr>
              <tr valign="top">
                <td>Bian et al [<xref ref-type="bibr" rid="ref54">54</xref>]</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
              </tr>
              <tr valign="top">
                <td>Del Fiol et al [<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                <td>✓</td>
                <td>NR</td>
                <td>✓</td>
                <td>NR</td>
                <td>NR</td>
                <td>Removed articles without abstracts, concatenated title, and abstract words</td>
              </tr>
              <tr valign="top">
                <td>Bian et al [<xref ref-type="bibr" rid="ref55">55</xref>]</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
              </tr>
              <tr valign="top">
                <td>Afzal et al [<xref ref-type="bibr" rid="ref56">56</xref>]</td>
                <td>✓</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
                <td>TF-IDF</td>
                <td>Removed articles with missing values</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>Applied.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>NR: not reported.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>TF-IDF: term frequency–inverse document frequency.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Feature Selection</title>
        <p>Most of the included articles relied on the text as their features (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Seven articles used words from titles and abstracts as their features [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref49">49</xref>-<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref56">56</xref>]. Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>] and Afzal et al [<xref ref-type="bibr" rid="ref36">36</xref>] used article metadata features, Unified Medical Language System features, SemRep semantic prediction, and MeSH terms in combination with the words of titles and abstracts features. Lin et al [<xref ref-type="bibr" rid="ref52">52</xref>] selected specific features from the citation dataset: journal impact factor, MeSH terms, sample size, <italic>P</italic> value, and confidence intervals. Bian et al [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>] relied on MEDLINE metadata as well as bibliometric features, which included citation count, journal impact factor, number of comments on PubMed, Altmetric score, study sample size, registration in ClinicalTrials.gov, and article age, and assessed how each feature contributed to the classification. The experiment by Bian et al [<xref ref-type="bibr" rid="ref55">55</xref>] used only time-agnostic features (features available at the time of an article’s publication), which are journal impact factor, sample size, number of grants, number of authors, number of clinically useful sentences, scientific impact of authors’ institution, numbers of references, page count, registration in ClinicalTrials.gov, and publication in PubMed Central. Afzal et al [<xref ref-type="bibr" rid="ref56">56</xref>] used automatic feature engineering with RapidMiner software for the title and abstract text feature extraction as part of the multilayer perceptron model.</p>
      </sec>
      <sec>
        <title>Machine Learning Classifier</title>
        <p>The majority of the included studies developed multiple algorithms and selected the top-performing one for their main classification tasks (<xref ref-type="table" rid="table3">Table 3</xref>). Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>], initially reported their results using SVM, NB, and boosting algorithms in both their 2003 and 2005 experiments; however, they ended up selecting SVM as their top-performing classifier in a separate study [<xref ref-type="bibr" rid="ref51">51</xref>]. Bian et al [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>] and Afzal et al [<xref ref-type="bibr" rid="ref36">36</xref>] compared the performance of multiple classifiers (SVM, NB, DT, k-nearest neighbors, random forest, multilayer perceptron) and selected the best performing for their experiment in the context of the same study (NB, DT, and SVM, respectively). We refer to the classifier that was selected for the classification task as the main classifier.</p>
        <p>From the included articles, SVM was the most used classifier. Five studies used an SVM algorithm as one of their main experiment classifiers (<xref ref-type="table" rid="table3">Table 3</xref>), 2 studies used a neural network as their main classifier; Del Fiol et al [<xref ref-type="bibr" rid="ref35">35</xref>] used a convolutional neural network (CNN), while Afzal et al [<xref ref-type="bibr" rid="ref56">56</xref>] used a multilayer feed-forward artificial neural network (ANN). DT algorithms were used in 2 studies for their main text classification function [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]. Four of the included studies applied multiple classifying approaches [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref53">53</xref>].</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Types of machine learning classifiers used in the main experiment to assess performance in each of the included studies.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="200"/>
            <col width="130"/>
            <col width="130"/>
            <col width="140"/>
            <col width="140"/>
            <col width="130"/>
            <col width="130"/>
            <thead>
              <tr valign="top">
                <td>Author</td>
                <td>Naïve Bayes</td>
                <td>SVM<sup>a</sup></td>
                <td>Decision tree</td>
                <td colspan="2">Ensemble</td>
                <td>Neural network</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  Boosting
                </td>
                <td>
                  Stacking
                </td>
                <td>
                  <break/>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                <td>✓<sup>b</sup></td>
                <td>✓</td>
                <td>N/A<sup>c</sup></td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref51">51</xref>]</td>
                <td>N/A</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>Lin et al [<xref ref-type="bibr" rid="ref52">52</xref>]</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>Afzal et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>N/A</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>Bian et al [<xref ref-type="bibr" rid="ref54">54</xref>]</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>Del Fiol et al [<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>✓</td>
              </tr>
              <tr valign="top">
                <td>Bian et al [<xref ref-type="bibr" rid="ref55">55</xref>]</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>Afzal et al [<xref ref-type="bibr" rid="ref56">56</xref>]</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>✓</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>SVM: support vector machine.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>Applied.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>Not applied.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Comparator for Evaluating the Performance of the Classifiers</title>
        <p>As per our inclusion criteria, to evaluate the performance of the machine learning method to classify articles appropriately, articles had to report a comparison of their applied machine learning model to a gold standard method such as gold standard high-quality articles retrieval method, for example, search filters, a manually annotated high-quality articles’ dataset, or a baseline machine learning model for high-quality articles retrieval (<xref ref-type="table" rid="table4">Table 4</xref>). Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref49">49</xref>-<xref ref-type="bibr" rid="ref51">51</xref>] used Clinical Query filters with sensitivity and specificity optimization [<xref ref-type="bibr" rid="ref57">57</xref>]. The experiment conducted by Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>] evaluated their machine learning approach by applying it in a new dataset annotated by experts. The NB high-quality algorithm by Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>] was considered a comparator on its own for its high recall and was used as such by Bian and colleagues [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>], who also used PubMed’s best match as a comparator. Lin et al [<xref ref-type="bibr" rid="ref52">52</xref>] used accuracy and k-value performance metrics in comparison to the results of the critical appraisal process by experts in the field. Also, Lin et al [<xref ref-type="bibr" rid="ref52">52</xref>] has applied a comparison between their classifier, which was a DT, to other known text classifiers like SVM and ANN. Afzal et al [<xref ref-type="bibr" rid="ref36">36</xref>] have used a SVM model for quality articles retrieval and compared its performance to the SVM model proposed by Sarker et al [<xref ref-type="bibr" rid="ref58">58</xref>], reporting that their classifier achieved a higher performance with their reported features selected.</p>
        <p>Del Fiol et al [<xref ref-type="bibr" rid="ref35">35</xref>] was the first study to incorporate the use of deep learning in quality articles retrieval, relying on a CNN. Del Fiol and colleagues [<xref ref-type="bibr" rid="ref35">35</xref>] compared their proposed classifier to the PubMed Clinical Queries broad filter since it achieves a nearly perfect recall. Also, they compared their proposed model to McMaster textword search and McMaster balanced search filter created by the Clinical Hedges group to evaluate the capabilities of their model of retrieving recently published evidence and achieving a balance between recall and precision [<xref ref-type="bibr" rid="ref35">35</xref>]. Afzal et al [<xref ref-type="bibr" rid="ref36">36</xref>], in their experiment using ANN, compared their model’s results to the CNN results of Del Fiol et al [<xref ref-type="bibr" rid="ref35">35</xref>], the DT results of Bian et al [<xref ref-type="bibr" rid="ref55">55</xref>], and their prior experiment using an SVM for quality articles retrieval [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref56">56</xref>]. Also, Afzal et al [<xref ref-type="bibr" rid="ref56">56</xref>] compared their proposed ANN to well-known algorithms used in the literature like NB, SVM, DT, and gradient boosted trees.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>The gold standard comparator used for evaluating machine learning models in the included studies.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="330"/>
            <col width="670"/>
            <thead>
              <tr valign="top">
                <td>Author</td>
                <td>Comparator</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref49">49</xref>-<xref ref-type="bibr" rid="ref51">51</xref>]</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>PubMed Clinical Query filter [<xref ref-type="bibr" rid="ref57">57</xref>]</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Testing dataset of 2000 articles annotated by experts (held-out testing dataset to test model’s generalization)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>Lin et al [<xref ref-type="bibr" rid="ref52">52</xref>]</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Critical appraisal by domain expert</p>
                    </list-item>
                    <list-item>
                      <p>SVM<sup>a</sup></p>
                    </list-item>
                    <list-item>
                      <p>Artificial neural network</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>Afzal et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>SVM proposed in Sarker et al [<xref ref-type="bibr" rid="ref58">58</xref>]</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>Bian et al [<xref ref-type="bibr" rid="ref54">54</xref>]</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Kilicoglu [<xref ref-type="bibr" rid="ref53">53</xref>] high-quality classifier</p>
                    </list-item>
                    <list-item>
                      <p>PubMed’s relevance sort</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>Del Fiol et al [<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>PubMed Clinical Query filter</p>
                    </list-item>
                    <list-item>
                      <p>McMaster textword search</p>
                    </list-item>
                    <list-item>
                      <p>McMaster balanced filter</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>Bian et al [<xref ref-type="bibr" rid="ref55">55</xref>]</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>] high-quality classifier</p>
                    </list-item>
                    <list-item>
                      <p>PubMed relevance sort</p>
                    </list-item>
                    <list-item>
                      <p>High-impact classifier with time-sensitive features included by Bian et al [<xref ref-type="bibr" rid="ref54">54</xref>]</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>Afzal et al [<xref ref-type="bibr" rid="ref56">56</xref>]</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Well-known algorithms used in the literature: NB<sup>b</sup>, SVM, DT<sup>c</sup>, GBT<sup>d</sup></p>
                    </list-item>
                    <list-item>
                      <p>Models from past research by Del Fiol et al [<xref ref-type="bibr" rid="ref35">35</xref>], Afzal et al [<xref ref-type="bibr" rid="ref36">36</xref>], and Bian et al [<xref ref-type="bibr" rid="ref55">55</xref>]</p>
                    </list-item>
                  </list>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>SVM: support vector machine.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>NB: naïve Bayes.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>DT: decision tree.</p>
            </fn>
            <fn id="table4fn4">
              <p><sup>d</sup>GBT: gradient boosted trees.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Performance Metrics</title>
        <p>All included articles applied a supervised machine learning model. Validation by applying a resampling k-fold approach was used in 7 studies. Five used 10-fold cross-validation [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref53">53</xref>], and 2 studies relied on 5-fold cross-validation [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref51">51</xref>]. The most common performance metrics used in the included studies were sensitivity (recall), specificity, accuracy, area under the curve (AUC), F-measure, and precision (<xref ref-type="table" rid="table5">Table 5</xref>). The recall was generally high, above 85%, across all experiment classifiers except the SVM by Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>], and the NB and DT reported by Bian et al [<xref ref-type="bibr" rid="ref54">54</xref>] and Bian et al [<xref ref-type="bibr" rid="ref55">55</xref>], respectively, as both had a recall below 30%. Precision ranged from 9% to 86%, with the neural network of Afzal et al [<xref ref-type="bibr" rid="ref56">56</xref>] and the SVM by Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>] the highest. AUC was measured in all studies and ranged from 0.73 to 0.99. Lin et al [<xref ref-type="bibr" rid="ref52">52</xref>] and Bian et al [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>] used novel performance metrics in their approaches. In the 2 studies by Bian and colleagues [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>], performance was primarily determined by calculating the top 20 precision which is the measure of the percentage of true positive citations among the first 20 retrieved citations. Lin et al [<xref ref-type="bibr" rid="ref52">52</xref>] used Cohen kappa (k-value) as their performance metric, which is the agreement between machine performance (observed value) and gold standard (expected value) [<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>]. Bian et al [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>] reported a top 20 precision of 34% with their 2017 NB classifier and 24% in their 2019 experiment using a DT classifier. Lin et al [<xref ref-type="bibr" rid="ref52">52</xref>] reported a k-value of 0.78 in their experiment.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Highest reported performance characteristics of the main classifier algorithms reported in the included studies.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="220"/>
            <col width="130"/>
            <col width="0"/>
            <col width="130"/>
            <col width="130"/>
            <col width="0"/>
            <col width="120"/>
            <col width="0"/>
            <col width="120"/>
            <col width="0"/>
            <col width="120"/>
            <thead>
              <tr valign="bottom">
                <td colspan="2">Classifier and author</td>
                <td colspan="2">Recall<sup>a</sup></td>
                <td>Specificity<sup>b</sup></td>
                <td colspan="2">Precision<sup>c</sup></td>
                <td colspan="2">F-score<sup>d</sup></td>
                <td colspan="2">AUC<sup>e</sup></td>
                <td>Accuracy<sup>f</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="12">
                  <bold>Support vector machine</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                <td>0.967</td>
                <td colspan="2">0.87</td>
                <td>0.169</td>
                <td colspan="2">0.29<sup>g</sup></td>
                <td colspan="2">0.98</td>
                <td colspan="2">0.893</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                <td>0.96</td>
                <td colspan="2">0.86</td>
                <td>0.18</td>
                <td colspan="2">0.30<sup>g</sup></td>
                <td colspan="2">0.97</td>
                <td colspan="2">NR<sup>h</sup></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref51">51</xref>]</td>
                <td>0.98</td>
                <td colspan="2">0.88</td>
                <td>0.305</td>
                <td colspan="2">0.47<sup>g</sup></td>
                <td colspan="2">0.95</td>
                <td colspan="2">NR</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>0.229</td>
                <td colspan="2">NR</td>
                <td>0.865</td>
                <td colspan="2">0.36</td>
                <td colspan="2">0.96</td>
                <td colspan="2">NR</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Afzal et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>NR</td>
                <td colspan="2">NR</td>
                <td>NR</td>
                <td colspan="2">0.87</td>
                <td colspan="2">0.73</td>
                <td colspan="2">0.785</td>
              </tr>
              <tr valign="top">
                <td colspan="12">
                  <bold>Naïve Bayes</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                <td>0.967</td>
                <td colspan="2">0.76</td>
                <td>0.091</td>
                <td colspan="2">0.17<sup>g</sup></td>
                <td colspan="2">0.95</td>
                <td colspan="2">0.787</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                <td>NR</td>
                <td colspan="2">NR</td>
                <td>NR</td>
                <td colspan="2">NR</td>
                <td colspan="2">0.95</td>
                <td colspan="2">NR</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>0.975</td>
                <td colspan="2">NR</td>
                <td>0.138</td>
                <td colspan="2">0.24</td>
                <td colspan="2">0.82</td>
                <td colspan="2">NR</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bian et al [<xref ref-type="bibr" rid="ref54">54</xref>]</td>
                <td>0.23</td>
                <td colspan="2">NR</td>
                <td>0.33</td>
                <td colspan="2">0.21</td>
                <td colspan="2">NR</td>
                <td colspan="2">NR</td>
              </tr>
              <tr valign="top">
                <td colspan="12">
                  <bold>Boosting</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                <td>0.967</td>
                <td colspan="2">0.786</td>
                <td>0.099</td>
                <td colspan="2">0.18<sup>g</sup></td>
                <td colspan="2">0.96</td>
                <td colspan="2">0.804</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                <td>NR</td>
                <td colspan="2">NR</td>
                <td>NR</td>
                <td colspan="2">NR</td>
                <td colspan="2">0.94</td>
                <td colspan="2">NR</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>0.729</td>
                <td colspan="2">NR</td>
                <td>0.823</td>
                <td colspan="2">0.77</td>
                <td colspan="2">0.97</td>
                <td colspan="2">NR</td>
              </tr>
              <tr valign="top">
                <td colspan="12">
                  <bold>Neural network</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Del Fiol et al [<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                <td>0.969</td>
                <td colspan="2">NR</td>
                <td>0.346</td>
                <td colspan="2">0.51</td>
                <td colspan="2">NR</td>
                <td colspan="2">NR</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Afzal et al [<xref ref-type="bibr" rid="ref56">56</xref>]</td>
                <td>0.951</td>
                <td colspan="2">NR</td>
                <td>0.863</td>
                <td colspan="2">0.9</td>
                <td colspan="2">0.99</td>
                <td colspan="2">0.973</td>
              </tr>
              <tr valign="top">
                <td colspan="12">
                  <bold>Decision tree</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Lin et al [<xref ref-type="bibr" rid="ref52">52</xref>]</td>
                <td>NR</td>
                <td colspan="2">NR</td>
                <td>NR</td>
                <td colspan="2">NR</td>
                <td colspan="2">NR</td>
                <td colspan="2">0.854</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bian et al [<xref ref-type="bibr" rid="ref55">55</xref>]</td>
                <td>0.09</td>
                <td colspan="2">NR</td>
                <td>0.39</td>
                <td colspan="2">0.14</td>
                <td colspan="2">NR</td>
                <td colspan="2">NR</td>
              </tr>
              <tr valign="top">
                <td colspan="12">
                  <bold>Stacking</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>0.864</td>
                <td colspan="2">NR</td>
                <td>0.747</td>
                <td colspan="2">0.801</td>
                <td colspan="2">0.98</td>
                <td colspan="2">NR</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>Recall: proportion of correctly identified positives among the real positive.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>Specificity: the proportion of actual negatives, which got predicted as the negative (or true negative).</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>Precision: proportion of correctly identified positives among all classified positives.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>F-score: harmonic mean of the precision and recall. F-score is equivalent to F1-score and used interchangeably.</p>
            </fn>
            <fn id="table5fn5">
              <p><sup>e</sup>AUC: area under the curve traced out by graphing the true positive rate against the false positive rate. The higher the AUC, the better the classifier prediction.</p>
            </fn>
            <fn id="table5fn6">
              <p><sup>f</sup>Accuracy: number of correctly predicted documents out of all classified documents.</p>
            </fn>
            <fn id="table5fn7">
              <p><sup>g</sup>Calculated as F-measure=(2*precision*recall)/(precision+recall) using recall and precision when available from the articles.</p>
            </fn>
            <fn id="table5fn8">
              <p><sup>h</sup>NR: not reported.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Summary</title>
        <p>To our knowledge, this is the first systematic review of machine learning approaches used to classify scientifically sound and clinically relevant studies from the biomedical literature. All included studies followed a supervised machine learning technique in which the learning algorithm depends on prelabeled data provided for training [<xref ref-type="bibr" rid="ref41">41</xref>]. Despite the technological advancements from 2003 to 2020 when the studies were published, none reported applying unsupervised or active learning approaches for the classification of articles based on quality. Active learning is a subtype of machine learning in which the learning algorithm is allowed to select the data from which it learns by querying a human operator and can achieve a performance comparable to the standard supervised learning algorithms with fewer labeled data [<xref ref-type="bibr" rid="ref21">21</xref>]. For example, active learning was used in the recent work by Gates et al [<xref ref-type="bibr" rid="ref61">61</xref>] and Tsou et al [<xref ref-type="bibr" rid="ref62">62</xref>], who used Abstrackr, a freely available active machine learning tool that automates the screening of titles and abstracts [<xref ref-type="bibr" rid="ref63">63</xref>]. Abstrackr achieved 100% sensitivity after screening only 31.8% of the citations in the dataset [<xref ref-type="bibr" rid="ref63">63</xref>].</p>
        <p>There is a limited range of quality standards comprising the prelabeled training datasets across the included articles. ACP Journal Club and the Clinical Hedges follow the same inclusion and exclusion criteria for high-quality evidence [<xref ref-type="bibr" rid="ref4">4</xref>]. Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref49">49</xref>] considered an article as high-quality if it were included in ACP Journal Club but considered only those classified as treatment, which limits their results to RCTs. The authors expanded their inclusion to articles tagged as treatment, diagnosis, prognosis, and etiology in their subsequent studies [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref51">51</xref>]. Having consistency across gold standard databases in classifier development strengthens our ability to compare performance. There are, however, limited manually annotated datasets available as these are time consuming and expensive to develop and require consistency and highly skilled people. Using studies that are included in guidelines and systematic reviews, as done by Bian et al [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>] and Afzal et al [<xref ref-type="bibr" rid="ref56">56</xref>], leverages screening work that has already been completed to a high standard; however, citations in guidelines may include lower quality evidence in the training process [<xref ref-type="bibr" rid="ref64">64</xref>].</p>
        <p>The limited availability of high-quality dataset options was highlighted by Afzal et al [<xref ref-type="bibr" rid="ref56">56</xref>], and finding the ideal gold standard training dataset was the most reported limitation in the included studies. In our opinion, the ideal gold standard training dataset should cover some criteria to overcome the limitations reported in the articles. First, the gold standard should be defined by precise criteria for methodological rigor that is created and recognized by experts in the field [<xref ref-type="bibr" rid="ref50">50</xref>]. Selection criteria for the gold standard should be unbiased. Aphinyanaphongs et al [<xref ref-type="bibr" rid="ref50">50</xref>] described their concern toward the possibility of a selection bias by the ACP Journal Club editors in a particular year toward a certain topic. Second, the gold standard training dataset should cover a large enough sample of the high-quality class to properly train the model and overcome the class imbalance bias toward the majority class of studies that are not of high quality [<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref65">65</xref>]. Third, the gold standard training set should cover multiple health care domains, as Lin et al [<xref ref-type="bibr" rid="ref52">52</xref>] reported their high-quality dataset was limited only to cardiovascular diseases and would not perform as well if applied to another medical domain. Fourth, the gold standard training dataset should be up to date as much as possible, which was a limitation reported in both studies by Bian et al [<xref ref-type="bibr" rid="ref54">54</xref>] and Afzal et al [<xref ref-type="bibr" rid="ref56">56</xref>].</p>
        <p>Another possible constraint affecting accurate prediction is the feature selection process. Del Fiol et al [<xref ref-type="bibr" rid="ref35">35</xref>] stated that using MeSH-based features instead of the sole reliance on text features in their experiment could have improved the precision of their neural network. In consensus with the recommendation of Del Fiol et al [<xref ref-type="bibr" rid="ref35">35</xref>], some of the included studies provided evidence that the use of a combination of features improves the overall performance of the classifiers. For example, in the experiment by Afzal et al [<xref ref-type="bibr" rid="ref36">36</xref>], the combination of publication type and MeSH term features in addition to title and abstract features produced the best and the most stable results. Also, Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>] proved that the incorporation of MEDLINE citation metadata and Unified Medical Language System features in addition to words of titles and abstracts yielded the best performance. Such important features may not be immediately available at the time of indexing in MEDLINE [<xref ref-type="bibr" rid="ref19">19</xref>], which poses a challenge in identifying recently published evidence [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref54">54</xref>].</p>
        <p>There was a higher rate of incorporating SVM algorithms in the experiments by the study authors. SVMs are known for their high accuracy [<xref ref-type="bibr" rid="ref66">66</xref>] and their low classification error [<xref ref-type="bibr" rid="ref41">41</xref>], making them ideal for linear classification. Afzal et al [<xref ref-type="bibr" rid="ref56">56</xref>] developed an ANN algorithm that had higher accuracy when compared with their previous SVM classifier [<xref ref-type="bibr" rid="ref36">36</xref>]. Further applications of newer machine learning approaches will advance the knowledge base on these quickly evolving methods. While SVMs currently have good accuracy and low error rates, emerging approaches may well outperform them.</p>
        <p>The main purpose of using machine learning in the classification of high-quality articles is to decrease the workload on those performing manual classification without losing relevant articles in the process. Recall, the proportion of correctly identified high-quality articles from the high-quality pool, is the most important metric to be used, followed by precision, the proportion of correctly identified positive articles among all those classified as positive. The included studies reported a range of recall and precision some of which would not meet the objective of identifying the high-quality articles correctly. For example, the NB classifier developed by Bian et al [<xref ref-type="bibr" rid="ref54">54</xref>] performed significantly less than the NB by Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>] and PubMed Best Match in terms of recall (23% vs 55% and 65%, respectively). Despite performing worse in recall, their classifier achieved a higher precision (33% vs 5% and 4%) [<xref ref-type="bibr" rid="ref54">54</xref>].</p>
        <p>Additionally, accuracy, the number of correctly predicted documents out of all classified documents, is considered a common metric for evaluating classifiers; however, its use is considered inappropriate to evaluate imbalanced dataset classification [<xref ref-type="bibr" rid="ref67">67</xref>]. For example, a classifier labeling all entries as false (given that false is the majority class) would have high accuracy but would fail to perform the needed task of accurately classifying the passing articles (rare class), making it useless [<xref ref-type="bibr" rid="ref68">68</xref>]. The harmonic mean of the recall and precision measurements is the F-score, and it is used to evaluate the machine learning algorithms implemented on unbalanced datasets [<xref ref-type="bibr" rid="ref67">67</xref>]. F-score was first used in the study by Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>] where the performance of the classifiers was reported using recall, precision, F-score, and AUC, without including accuracy. Additionally, Afzal et al [<xref ref-type="bibr" rid="ref36">36</xref>] did not rely on recall to compare between multiple classifiers; instead, they used the F-score, precision, and accuracy. Also, they have applied a novel approach to compare between the classifiers, in which they summed the metrics for a classifier with a higher sum reflecting better performance [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
        <p>The highest reported recall in our review was 98% with the SVM developed by Aphinyanaphongs and Aliferis [<xref ref-type="bibr" rid="ref51">51</xref>], however, the algorithm had low precision of 30.5%. The best balance between recall and precision was achieved by the ANN approach used by Afzal et al [<xref ref-type="bibr" rid="ref56">56</xref>], which reported a high recall of 95.1% and a high precision of 86.3%, thereby achieving the target of not losing quality literature while decreasing the manual classification workload.</p>
        <p>The experiment by Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>] assesses the effect of applying 3 different machine learning classifiers (SVM, NB, boosting, and ensemble) trained using the same Clinical Hedges dataset on the overall performance of the resulting models. Using multiple feature set combinations, the highest recall was achieved by the NB classifier, and the highest F-scores were achieved by ensemble (0.80) and text-boosting (0.77) based models [<xref ref-type="bibr" rid="ref53">53</xref>]. Only the studies by Aphinyanaphongs and colleagues [<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>] and Kilicoglu et al [<xref ref-type="bibr" rid="ref53">53</xref>] incorporated ensemble techniques in the development of their main classifiers, and their results suggest that using multiple classifiers in combination can improve the balance between recall and precision (the F-score).</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>This is the first systematic review to characterize the machine learning approaches in high-quality article retrieval. When narrowing our research question, we excluded other text summarization and text categorization approaches being used in the biomedical literature. These include but are not limited to studies concerned with the automation of the systematic review process [<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref70">70</xref>], biomedical literature summarization [<xref ref-type="bibr" rid="ref71">71</xref>], and semantic models’ applications in the biomedical literature [<xref ref-type="bibr" rid="ref72">72</xref>]. Given the technical nature of the application of machine learning approaches for text classification, we expanded our search beyond clinical bibliographic databases to include those which index technical articles.</p>
        <p>Across the included studies, some steps were not fully reported in the methods, including preprocessing steps, cross-validation folds, and features selected. To our knowledge, there are no reporting guidelines for machine learning approaches being applied for literature retrieval. The Equator Network includes 6 reporting guidelines for machine learning approaches; however, all 6 are focused on articles applying machine learning in clinical settings [<xref ref-type="bibr" rid="ref73">73</xref>]. For example, the most recently published guideline focuses on the reporting of interventions involving artificial intelligence in clinical trial protocols [<xref ref-type="bibr" rid="ref74">74</xref>]. The lack of reporting guidance for the NLP component of machine learning being applied in the biomedical literature creates a noticeable gap in reporting the steps of the applied approach, features used and justification for their use, and inconsistency in the reported performance achieved by the machine. As a result, there was a lack of consistency in the reporting of results and methods provided by the authors, which also limits our ability to compare the performance of the classifiers. Also, one of the limitations developing the review was the inability to directly compare the performance of the models across the included studies because of the different training datasets and the applied settings. Finally, a challenge with machine learning is that the algorithms are considered as being derived in a black box; an enigmatic interpretation that the machines provide findings and predictions without any accompanying explanation [<xref ref-type="bibr" rid="ref75">75</xref>].</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>Despite the longevity of research for the identification of high-quality literature using machine learning, evidence is still scarce and slowly progressing over time, and determining the most reliable approach is difficult as the field is quickly evolving. This slow progression in the field may have been caused by the lack of publicly available standard benchmarks for the identification of high-quality articles biomedical literature to compare the performance of the proposed methods. A similar problem was addressed in the molecular machine learning domain by creating MolecularNet, a large-scale, open-source, and high-quality benchmark for molecular learning algorithms [<xref ref-type="bibr" rid="ref76">76</xref>]. Our review provides a summary of current approaches and performance of machine learning models applied to retrieve high-quality evidence for clinical consideration from the biomedical literature and highlights the importance of selecting optimal quality gold standard data for training. The findings include that the use of different feature sets in combination with text features is likely to improve the performance of machine learning models. There is a lack of reporting consistency in the literature which makes replication of the experiments difficult. Supervised machine learning has been the focus to date. The rapid development in the field of NLP and the availability of new state of the art techniques such as Bidirectional Encoder Representations from Transformers (BERT) for language understanding [<xref ref-type="bibr" rid="ref77">77</xref>] and bio-BERT for biomedical text mining [<xref ref-type="bibr" rid="ref78">78</xref>] hold promise for future advances in the field of information extraction from the biomedical literature. Considering the increasingly available data to apply these approaches to, we anticipate that the performance of classifiers to identify high-quality evidence will continue to grow.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Features selected by the included articles.</p>
        <media xlink:href="medinform_v9i9e30401_app1.pdf" xlink:title="PDF File  (Adobe PDF File), 187 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ACP</term>
          <def>
            <p>American College of Physicians</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">ANN</term>
          <def>
            <p>artificial neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">BERT</term>
          <def>
            <p>Bidirectional Encoder Representations from Transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">CNN</term>
          <def>
            <p>convolutional neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">DT</term>
          <def>
            <p>decision tree</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">EBM</term>
          <def>
            <p>evidence-based medicine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">MeSH</term>
          <def>
            <p>Medical Subject Heading</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">NB</term>
          <def>
            <p>naïve Bayes</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">RCT</term>
          <def>
            <p>randomized controlled trial</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">SVM</term>
          <def>
            <p>support vector machine</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We thank Rita Jezrawi and Hamza Issa for assistance screening articles for inclusion. We thank Dr Mehrdad Roham for proofreading the final version of the manuscript.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>All authors contributed to the design of the study. TN and WA developed the search strategies. WA ran the searches and led the screening and data abstraction. All authors contributed to the interpretation of the data. WA and CL drafted early versions of the manuscript. All authors supervised the study and reviewed and provided revisions to the manuscript. All authors approved the final manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guyatt</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Jaeschke</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Montori</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Richardson</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Guyatt</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Rennie</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Meade</surname>
              <given-names>MO</given-names>
            </name>
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>DJ</given-names>
            </name>
          </person-group>
          <article-title>What Is evidence-based medicine?</article-title>
          <source>Users’ Guides to the Medical Literature: A Manual for Evidence-Based Clinical Practice, 3rd Edition</source>
          <year>2015</year>
          <publisher-loc>New York</publisher-loc>
          <publisher-name>McGraw-Hill Education</publisher-name>
          <fpage>7</fpage>
          <lpage>14</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kamath</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Guyatt</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Importance of evidence-based medicine on research and practice</article-title>
          <source>Indian J Anaesth</source>
          <year>2016</year>
          <month>09</month>
          <volume>60</volume>
          <issue>9</issue>
          <fpage>622</fpage>
          <lpage>625</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.ijaweb.org/article.asp?issn=0019-5049;year=2016;volume=60;issue=9;spage=622;epage=625;aulast=Kamath"/>
          </comment>
          <pub-id pub-id-type="doi">10.4103/0019-5049.190615</pub-id>
          <pub-id pub-id-type="medline">27729686</pub-id>
          <pub-id pub-id-type="pii">IJA-60-622</pub-id>
          <pub-id pub-id-type="pmcid">PMC5037940</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <source>MEDLINE PubMed Production Statistics</source>
          <access-date>2021-08-23</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nlm.nih.gov/bsd/medline_pubmed_production_stats.html">https://www.nlm.nih.gov/bsd/medline_pubmed_production_stats.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wilczynski</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Morgan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
            <collab>Hedges Team</collab>
          </person-group>
          <article-title>An overview of the design and methods for retrieving high-quality studies for clinical care</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2005</year>
          <month>06</month>
          <day>21</day>
          <volume>5</volume>
          <fpage>20</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/1472-6947-5-20"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1472-6947-5-20</pub-id>
          <pub-id pub-id-type="medline">15969765</pub-id>
          <pub-id pub-id-type="pii">1472-6947-5-20</pub-id>
          <pub-id pub-id-type="pmcid">PMC1183213</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beale</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Duffy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Glanville</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lefebvre</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>McCool</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Varley</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Boachie</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fraser</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Harbour</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Choosing and using methodological search filters: searchers' views</article-title>
          <source>Health Info Libr J</source>
          <year>2014</year>
          <month>04</month>
          <day>23</day>
          <volume>31</volume>
          <issue>2</issue>
          <fpage>133</fpage>
          <lpage>147</lpage>
          <pub-id pub-id-type="doi">10.1111/hir.12062</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wilczynski</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
            <collab>Hedges Team</collab>
          </person-group>
          <article-title>Developing optimal search strategies for detecting clinically sound causation studies in MEDLINE</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2003</year>
          <fpage>719</fpage>
          <lpage>723</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/14728267"/>
          </comment>
          <pub-id pub-id-type="medline">14728267</pub-id>
          <pub-id pub-id-type="pii">D030002662</pub-id>
          <pub-id pub-id-type="pmcid">PMC1480286</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Leeflang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Scholten</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rutjes</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Reitsma</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bossuyt</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Use of methodological search filters to identify diagnostic accuracy studies can lead to the omission of relevant studies</article-title>
          <source>J Clin Epidemiol</source>
          <year>2006</year>
          <month>03</month>
          <volume>59</volume>
          <issue>3</issue>
          <fpage>234</fpage>
          <lpage>240</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2005.07.014</pub-id>
          <pub-id pub-id-type="medline">16488353</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(05)00327-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Damarell</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>May</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hammond</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sladek</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Tieman</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>Topic search filters: a systematic scoping review</article-title>
          <source>Health Info Libr J</source>
          <year>2019</year>
          <month>03</month>
          <day>21</day>
          <volume>36</volume>
          <issue>1</issue>
          <fpage>4</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1111/hir.12244</pub-id>
          <pub-id pub-id-type="medline">30578606</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McKibbon</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wilczynski</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>R</given-names>
            </name>
            <collab>Hedges Team</collab>
          </person-group>
          <article-title>Retrieving randomized controlled trials from medline: a comparison of 38 published search filters</article-title>
          <source>Health Info Libr J</source>
          <year>2009</year>
          <month>09</month>
          <volume>26</volume>
          <issue>3</issue>
          <fpage>187</fpage>
          <lpage>202</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1111/j.1471-1842.2008.00827.x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1471-1842.2008.00827.x</pub-id>
          <pub-id pub-id-type="medline">19712211</pub-id>
          <pub-id pub-id-type="pii">HIR827</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>McKibbon</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
          </person-group>
          <article-title>A quantitative analysis of research publications in physical therapy journals</article-title>
          <source>Phys Ther</source>
          <year>2003</year>
          <month>02</month>
          <volume>83</volume>
          <issue>2</issue>
          <fpage>123</fpage>
          <lpage>131</lpage>
          <pub-id pub-id-type="medline">12564948</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="web">
          <article-title>Search filters for MEDLINE in Ovid Syntax and the PubMed translation</article-title>
          <source>Health Information Research Unit, McMaster University</source>
          <access-date>2021-01-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://hiru.mcmaster.ca/hiru/HIRU_Hedges_MEDLINE_Strategies.aspx">https://hiru.mcmaster.ca/hiru/HIRU_Hedges_MEDLINE_Strategies.aspx</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="web">
          <article-title>Hedges</article-title>
          <source>Health Information Research Unit, McMaster University</source>
          <access-date>2021-05-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://hiru.mcmaster.ca/hiru/HIRU_Hedges_home.aspx">https://hiru.mcmaster.ca/hiru/HIRU_Hedges_home.aspx</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jadad</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Carroll</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jenkinson</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Reynolds</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Gavaghan</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>McQuay</surname>
              <given-names>HJ</given-names>
            </name>
          </person-group>
          <article-title>Assessing the quality of reports of randomized clinical trials: is blinding necessary?</article-title>
          <source>Control Clin Trials</source>
          <year>1996</year>
          <month>02</month>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="doi">10.1016/0197-2456(95)00134-4</pub-id>
          <pub-id pub-id-type="medline">8721797</pub-id>
          <pub-id pub-id-type="pii">0197-2456(95)00134-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Higgins</surname>
              <given-names>JPT</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Gøtzsche</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>Jüni</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Oxman</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Savovic</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schulz</surname>
              <given-names>KF</given-names>
            </name>
            <name name-style="western">
              <surname>Weeks</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sterne</surname>
              <given-names>JAC</given-names>
            </name>
            <collab>Cochrane Bias Methods Group</collab>
            <collab>Cochrane Statistical Methods Group</collab>
          </person-group>
          <article-title>The Cochrane Collaboration's tool for assessing risk of bias in randomised trials</article-title>
          <source>BMJ</source>
          <year>2011</year>
          <month>10</month>
          <day>18</day>
          <volume>343</volume>
          <issue>oct18 2</issue>
          <fpage>d5928</fpage>
          <lpage>d5928</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22008217"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.d5928</pub-id>
          <pub-id pub-id-type="medline">22008217</pub-id>
          <pub-id pub-id-type="pmcid">PMC3196245</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="web">
          <article-title>Inclusion Criteria</article-title>
          <source>Health Information Research Unit, McMaster University</source>
          <year>2019</year>
          <access-date>2021-05-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://hiru.mcmaster.ca/hiru/InclusionCriteria.html">https://hiru.mcmaster.ca/hiru/InclusionCriteria.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Wilczynski</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
            <collab>Hedges Team</collab>
          </person-group>
          <article-title>Developing optimal search strategies for detecting clinically relevant qualitative studies in MEDLINE</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2004</year>
          <volume>107</volume>
          <issue>Pt 1</issue>
          <fpage>311</fpage>
          <lpage>316</lpage>
          <pub-id pub-id-type="medline">15360825</pub-id>
          <pub-id pub-id-type="pii">D040004298</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gill</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>NW</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>KY</given-names>
            </name>
            <name name-style="western">
              <surname>Heneghan</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Development of a search filter for identifying studies completed in primary care</article-title>
          <source>Fam Pract</source>
          <year>2014</year>
          <month>12</month>
          <day>18</day>
          <volume>31</volume>
          <issue>6</issue>
          <fpage>739</fpage>
          <lpage>745</lpage>
          <pub-id pub-id-type="doi">10.1093/fampra/cmu066</pub-id>
          <pub-id pub-id-type="medline">25326923</pub-id>
          <pub-id pub-id-type="pii">cmu066</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wilczynski</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>McKibbon</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Walter</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Garg</surname>
              <given-names>AX</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
          </person-group>
          <article-title>MEDLINE clinical queries are robust when searching in recent publishing years</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2013</year>
          <volume>20</volume>
          <issue>2</issue>
          <fpage>363</fpage>
          <lpage>368</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23019242"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2012-001075</pub-id>
          <pub-id pub-id-type="medline">23019242</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2012-001075</pub-id>
          <pub-id pub-id-type="pmcid">PMC3638187</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Irwin</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Rackham</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Comparison of the time-to-indexing in PubMed between biomedical journals according to impact factor, discipline, and focus</article-title>
          <source>Res Social Adm Pharm</source>
          <year>2017</year>
          <volume>13</volume>
          <issue>2</issue>
          <fpage>389</fpage>
          <lpage>393</lpage>
          <pub-id pub-id-type="doi">10.1016/j.sapharm.2016.04.006</pub-id>
          <pub-id pub-id-type="medline">27215603</pub-id>
          <pub-id pub-id-type="pii">S1551-7411(16)30019-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tsafnat</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Glasziou</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Karystianis</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Coiera</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Automated screening of research studies for systematic reviews using study characteristics</article-title>
          <source>Syst Rev</source>
          <year>2018</year>
          <month>04</month>
          <day>25</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>64</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://systematicreviewsjournal.biomedcentral.com/articles/10.1186/s13643-018-0724-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13643-018-0724-7</pub-id>
          <pub-id pub-id-type="medline">29695296</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13643-018-0724-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC5918752</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mohri</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rostamizadeh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Talwalkar</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Bach</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <source>Foundations of Machine Learning, Second edition</source>
          <year>2018</year>
          <publisher-loc>Cambridge</publisher-loc>
          <publisher-name>MIT Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mitchell</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <source>Machine Learning, 1st ed</source>
          <year>1997</year>
          <publisher-loc>New York</publisher-loc>
          <publisher-name>McGraw-Hill Science</publisher-name>
          <fpage>432</fpage>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Koh</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Data mining applications in healthcare</article-title>
          <source>J Healthc Inf Manag</source>
          <year>2005</year>
          <volume>19</volume>
          <issue>2</issue>
          <fpage>64</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="medline">15869215</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bahri</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zoghlami</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Abed</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tavares</surname>
              <given-names>JMRS</given-names>
            </name>
          </person-group>
          <article-title>Big data for healthcare: a survey</article-title>
          <source>IEEE Access</source>
          <year>2019</year>
          <volume>7</volume>
          <fpage>7397</fpage>
          <lpage>7408</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2018.2889180</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beam</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>IS</given-names>
            </name>
          </person-group>
          <article-title>Big data and machine learning in health care</article-title>
          <source>JAMA</source>
          <year>2018</year>
          <month>04</month>
          <day>03</day>
          <volume>319</volume>
          <issue>13</issue>
          <fpage>1317</fpage>
          <lpage>1318</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2017.18391</pub-id>
          <pub-id pub-id-type="medline">29532063</pub-id>
          <pub-id pub-id-type="pii">2675024</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wiens</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shenoy</surname>
              <given-names>ES</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for healthcare: on the verge of a major shift in healthcare epidemiology</article-title>
          <source>Clin Infect Dis</source>
          <year>2018</year>
          <month>01</month>
          <day>06</day>
          <volume>66</volume>
          <issue>1</issue>
          <fpage>149</fpage>
          <lpage>153</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29020316"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/cid/cix731</pub-id>
          <pub-id pub-id-type="medline">29020316</pub-id>
          <pub-id pub-id-type="pii">4085880</pub-id>
          <pub-id pub-id-type="pmcid">PMC5850539</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wiens</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Guttag</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Horvitz</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Patient risk stratification with time-varying parameters: a multitask learning approach</article-title>
          <source>J Mach Learning Res</source>
          <year>2016</year>
          <volume>17</volume>
          <fpage>1</fpage>
          <lpage>23</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jmlr.org/papers/volume17/15-177/15-177.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/b978-0-12-802121-7.00045-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wiens</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Guttag</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Horvitz</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>A study in transfer learning: leveraging data from multiple hospitals to enhance hospital-specific predictions</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2014</year>
          <volume>21</volume>
          <issue>4</issue>
          <fpage>699</fpage>
          <lpage>706</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=24481703"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2013-002162</pub-id>
          <pub-id pub-id-type="medline">24481703</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2013-002162</pub-id>
          <pub-id pub-id-type="pmcid">PMC4078276</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wiens</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Horvitz</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Guttag</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Pereira</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Burges</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bottou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Weinberger</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Patient risk stratification for hospital-associated C. diff as a time-series classification task</article-title>
          <source>Advances in Neural Information Processing Systems</source>
          <year>2012</year>
          <publisher-loc>Red Hook</publisher-loc>
          <publisher-name>Curran Associates, Inc</publisher-name>
          <fpage>467</fpage>
          <lpage>475</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Burkov</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>The Hundred-Page Machine Learning Book, 1st ed</source>
          <year>2019</year>
          <publisher-loc>Quebec City</publisher-loc>
          <publisher-name>Andriy Burkov</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hearst</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Mitkov</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Text Data Mining</article-title>
          <source>The Oxford Handbook of Computational Linguistics (1st ed)</source>
          <year>2012</year>
          <publisher-loc>Oxford</publisher-loc>
          <publisher-name>Oxford University Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gong</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Application of biomedical text mining</article-title>
          <source>Artificial Intelligence—Emerging Trends and Applications InTech</source>
          <year>2018</year>
          <publisher-loc>London</publisher-loc>
          <publisher-name>IntechOpen</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Davidoff</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Miglus</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Delivering clinical evidence where it's needed: building an information system worthy of the profession</article-title>
          <source>JAMA</source>
          <year>2011</year>
          <month>05</month>
          <day>11</day>
          <volume>305</volume>
          <issue>18</issue>
          <fpage>1906</fpage>
          <lpage>1907</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2011.619</pub-id>
          <pub-id pub-id-type="medline">21558524</pub-id>
          <pub-id pub-id-type="pii">305/18/1906</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fiszman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Weir</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Jonnalagadda</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mostafa</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Del Fiol</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Text summarization in the biomedical domain: a systematic review of recent research</article-title>
          <source>J Biomed Inform</source>
          <year>2014</year>
          <month>12</month>
          <volume>52</volume>
          <fpage>457</fpage>
          <lpage>467</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(14)00147-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2014.06.009</pub-id>
          <pub-id pub-id-type="medline">25016293</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(14)00147-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC4261035</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Del Fiol</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Michelson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Iorio</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cotoi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
          </person-group>
          <article-title>A deep learning method to automatically identify reports of scientifically rigorous clinical research from the biomedical literature: comparative analytic study</article-title>
          <source>J Med Internet Res</source>
          <year>2018</year>
          <month>06</month>
          <day>25</day>
          <volume>20</volume>
          <issue>6</issue>
          <fpage>e10281</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2018/6/e10281/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/10281</pub-id>
          <pub-id pub-id-type="medline">29941415</pub-id>
          <pub-id pub-id-type="pii">v20i6e10281</pub-id>
          <pub-id pub-id-type="pmcid">PMC6037944</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Afzal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hussain</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Context-aware grading of quality evidences for evidence-based decision-making</article-title>
          <source>Health Informatics J</source>
          <year>2019</year>
          <month>06</month>
          <volume>25</volume>
          <issue>2</issue>
          <fpage>429</fpage>
          <lpage>445</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/1460458217719560?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub%3dpubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/1460458217719560</pub-id>
          <pub-id pub-id-type="medline">28766402</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Small</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Brodley</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schmid</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Bertram</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lill</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Trikalinos</surname>
              <given-names>TA</given-names>
            </name>
          </person-group>
          <article-title>Toward modernizing the systematic review pipeline in genetics: efficient updating via data mining</article-title>
          <source>Genet Med</source>
          <year>2012</year>
          <month>07</month>
          <volume>14</volume>
          <issue>7</issue>
          <fpage>663</fpage>
          <lpage>669</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22481134"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/gim.2012.7</pub-id>
          <pub-id pub-id-type="medline">22481134</pub-id>
          <pub-id pub-id-type="pii">gim20127</pub-id>
          <pub-id pub-id-type="pmcid">PMC3908550</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Small</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Brodley</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Trikalinos</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Deploying an interactive machine learning system in an evidence-based practice center: Abstrackr</article-title>
          <source>Proc 2nd ACM SIGHIT Int Health Informat Symp</source>
          <year>2012</year>
          <fpage>819</fpage>
          <lpage>824</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.intechopen.com/chapters/60491"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2110363.2110464</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rindflesch</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fiszman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Libbus</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Semantic interpretation for the biomedical research literature</article-title>
          <source>Med Informatics</source>
          <year>2006</year>
          <fpage>399</fpage>
          <lpage>422</lpage>
          <pub-id pub-id-type="doi">10.1007/0-387-25739-x_14</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Holzinger</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for health informatics</article-title>
          <source>LNCS</source>
          <year>2016</year>
          <volume>9605</volume>
          <fpage>1</fpage>
          <lpage>24</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-319-50478-0_1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Machine learning algorithms: a review</article-title>
          <source>Int J Comput Sci Inf Technol</source>
          <year>2016</year>
          <volume>7</volume>
          <issue>3</issue>
          <fpage>1174</fpage>
          <lpage>1179</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://ijcsit.com/docs/Volume%207/vol7issue3/ijcsit2016070332.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The basics of machine learning: strategies and techniques</article-title>
          <source>Artificial Intelligence and Deep Learning in Pathology</source>
          <year>2021</year>
          <publisher-loc>Philadelphia</publisher-loc>
          <publisher-name>Elsevier</publisher-name>
          <fpage>13</fpage>
          <lpage>40</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Welling</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A First Encounter with Machine Learning</article-title>
          <source>University of California Irvine</source>
          <year>2011</year>
          <access-date>2021-08-23</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.441.6238&#38;rep=rep1&#38;type=pdf">http://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.441.6238&#38;rep=rep1&#38;type=pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Artificial neural network</article-title>
          <source>Interdisciplinary Computing in Java Programming</source>
          <year>2003</year>
          <publisher-loc>Boston</publisher-loc>
          <publisher-name>Springer US</publisher-name>
          <fpage>81</fpage>
          <lpage>100</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hiregoudar</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Manjunath</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Patil</surname>
              <given-names>KS</given-names>
            </name>
          </person-group>
          <article-title>A survey: research summary on neural networks</article-title>
          <source>Int J Res Engineer Technol</source>
          <year>2014</year>
          <month>05</month>
          <day>25</day>
          <volume>03</volume>
          <issue>15</issue>
          <fpage>385</fpage>
          <lpage>389</lpage>
          <pub-id pub-id-type="doi">10.15623/ijret.2014.0315076</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marshall</surname>
              <given-names>IJ</given-names>
            </name>
            <name name-style="western">
              <surname>Noel-Storr</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kuiper</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>BC</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for identifying randomized controlled trials: an evaluation and practitioner's guide</article-title>
          <source>Res Synth Methods</source>
          <year>2018</year>
          <month>12</month>
          <volume>9</volume>
          <issue>4</issue>
          <fpage>602</fpage>
          <lpage>614</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29314757"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/jrsm.1287</pub-id>
          <pub-id pub-id-type="medline">29314757</pub-id>
          <pub-id pub-id-type="pmcid">PMC6030513</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Mittal</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Text classification using machine learning methods: a survey</article-title>
          <year>2014</year>
          <conf-name>Proceedings of the Second International Conference on Soft Computing for Problem Solving</conf-name>
          <conf-date>2014</conf-date>
          <conf-loc>New Delhi</conf-loc>
          <fpage>701</fpage>
          <lpage>709</lpage>
          <pub-id pub-id-type="doi">10.1007/978-81-322-1602-5_75</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Page</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>McKenzie</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Bossuyt</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Boutron</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffmann</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Mulrow</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Shamseer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tetzlaff</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Akl</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Glanville</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Grimshaw</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Hróbjartsson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lalu</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Loder</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Mayo-Wilson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>McDonald</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McGuinness</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tricco</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Welch</surname>
              <given-names>VA</given-names>
            </name>
            <name name-style="western">
              <surname>Whiting</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The PRISMA 2020 statement: an updated guideline for reporting systematic reviews</article-title>
          <source>BMJ</source>
          <year>2021</year>
          <month>03</month>
          <day>29</day>
          <volume>372</volume>
          <fpage>n71</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/lookup/pmidlookup?view=long&#38;pmid=33782057"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.n71</pub-id>
          <pub-id pub-id-type="medline">33782057</pub-id>
          <pub-id pub-id-type="pmcid">PMC8005924</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aphinyanaphongs</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Aliferis</surname>
              <given-names>CF</given-names>
            </name>
          </person-group>
          <article-title>Text categorization models for retrieval of high quality articles in internal medicine</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2003</year>
          <fpage>31</fpage>
          <lpage>35</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/14728128"/>
          </comment>
          <pub-id pub-id-type="medline">14728128</pub-id>
          <pub-id pub-id-type="pii">D030003601</pub-id>
          <pub-id pub-id-type="pmcid">PMC1480096</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aphinyanaphongs</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tsamardinos</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Statnikov</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hardin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Aliferis</surname>
              <given-names>CF</given-names>
            </name>
          </person-group>
          <article-title>Text categorization models for high-quality article retrieval in internal medicine</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2005</year>
          <volume>12</volume>
          <issue>2</issue>
          <fpage>207</fpage>
          <lpage>216</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=15561789"/>
          </comment>
          <pub-id pub-id-type="doi">10.1197/jamia.M1641</pub-id>
          <pub-id pub-id-type="medline">15561789</pub-id>
          <pub-id pub-id-type="pii">M1641</pub-id>
          <pub-id pub-id-type="pmcid">PMC551552</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aphinyanaphongs</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Aliferis</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Prospective validation of text categorization filters for identifying high-quality, content-specific articles in MEDLINE</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2006</year>
          <fpage>6</fpage>
          <lpage>10</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/17238292"/>
          </comment>
          <pub-id pub-id-type="medline">17238292</pub-id>
          <pub-id pub-id-type="pii">86426</pub-id>
          <pub-id pub-id-type="pmcid">PMC1839419</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ebell</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Chiang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Automating the process of critical appraisal and assessing the strength of evidence with information extraction technology</article-title>
          <source>J Eval Clin Pract</source>
          <year>2011</year>
          <month>08</month>
          <volume>17</volume>
          <issue>4</issue>
          <fpage>832</fpage>
          <lpage>838</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1365-2753.2011.01712.x</pub-id>
          <pub-id pub-id-type="medline">21707873</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kilicoglu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Demner-Fushman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Rindflesch</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Wilczynski</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
          </person-group>
          <article-title>Towards automatic recognition of scientifically rigorous clinical research evidence</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2009</year>
          <volume>16</volume>
          <issue>1</issue>
          <fpage>25</fpage>
          <lpage>31</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18952929"/>
          </comment>
          <pub-id pub-id-type="doi">10.1197/jamia.M2996</pub-id>
          <pub-id pub-id-type="medline">18952929</pub-id>
          <pub-id pub-id-type="pii">M2996</pub-id>
          <pub-id pub-id-type="pmcid">PMC2605595</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Morid</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Jonnalagadda</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Del Fiol</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Automatic identification of high impact articles in PubMed to support clinical decision making</article-title>
          <source>J Biomed Inform</source>
          <year>2017</year>
          <month>09</month>
          <volume>73</volume>
          <fpage>95</fpage>
          <lpage>103</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(17)30171-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2017.07.015</pub-id>
          <pub-id pub-id-type="medline">28756159</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(17)30171-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC5583030</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Abdelrahman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Del Fiol</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Automatic identification of recent high impact clinical articles in PubMed to support clinical decision making using time-agnostic features</article-title>
          <source>J Biomed Inform</source>
          <year>2019</year>
          <month>01</month>
          <volume>89</volume>
          <fpage>1</fpage>
          <lpage>10</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(18)30219-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2018.11.010</pub-id>
          <pub-id pub-id-type="medline">30468912</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(18)30219-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC6342626</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Afzal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hussain</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Deep learning based biomedical literature classification using criteria of scientific rigor</article-title>
          <source>Electronics (Switzerland)</source>
          <year>2020</year>
          <month>08</month>
          <day>05</day>
          <volume>9</volume>
          <issue>8</issue>
          <fpage>1</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="doi">10.3390/electronics9081253</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="web">
          <article-title>PubMed Clinical Queries Search Filter</article-title>
          <source>National Library of Medicine</source>
          <access-date>2021-05-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pubmed.ncbi.nlm.nih.gov/clinical/">https://pubmed.ncbi.nlm.nih.gov/clinical/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sarker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mollá</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Paris</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Automatic evidence quality prediction to support evidence-based decision making</article-title>
          <source>Artif Intell Med</source>
          <year>2015</year>
          <month>06</month>
          <volume>64</volume>
          <issue>2</issue>
          <fpage>89</fpage>
          <lpage>103</lpage>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2015.04.001</pub-id>
          <pub-id pub-id-type="medline">25983133</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(15)00041-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Automated evaluation of electronic discharge notes to assess quality of care for cardiovascular diseases using Medical Language Extraction and Encoding System (MedLEE)</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2010</year>
          <month>05</month>
          <day>01</day>
          <volume>17</volume>
          <issue>3</issue>
          <fpage>245</fpage>
          <lpage>252</lpage>
          <pub-id pub-id-type="doi">10.1136/jamia.2009.000182</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rau</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Shih</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of Cohen's kappa and other measures of inter-rater agreement for genre analysis and other nominal data</article-title>
          <source>J Engl Acad Purposes</source>
          <year>2021</year>
          <month>09</month>
          <volume>53</volume>
          <fpage>101026</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jeap.2021.101026</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gates</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hartling</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Technology-assisted title and abstract screening for systematic reviews: a retrospective evaluation of the Abstrackr machine learning tool</article-title>
          <source>Syst Rev</source>
          <year>2018</year>
          <month>03</month>
          <day>12</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>45</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://systematicreviewsjournal.biomedcentral.com/articles/10.1186/s13643-018-0707-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13643-018-0707-8</pub-id>
          <pub-id pub-id-type="medline">29530097</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13643-018-0707-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC5848519</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tsou</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Treadwell</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Erinoff</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Schoelles</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for screening prioritization in systematic reviews: comparative performance of Abstrackr and EPPI-Reviewer</article-title>
          <source>Syst Rev</source>
          <year>2020</year>
          <month>04</month>
          <day>02</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>73</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://systematicreviewsjournal.biomedcentral.com/articles/10.1186/s13643-020-01324-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13643-020-01324-7</pub-id>
          <pub-id pub-id-type="medline">32241297</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13643-020-01324-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC7118839</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Trikalinos</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Brodley</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schmid</surname>
              <given-names>CH</given-names>
            </name>
          </person-group>
          <article-title>Semi-automated screening of biomedical citations for systematic reviews</article-title>
          <source>BMC Bioinformatics</source>
          <year>2010</year>
          <month>01</month>
          <day>26</day>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>55</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-11-55"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2105-11-55</pub-id>
          <pub-id pub-id-type="medline">20102628</pub-id>
          <pub-id pub-id-type="pii">1471-2105-11-55</pub-id>
          <pub-id pub-id-type="pmcid">PMC2824679</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Venus</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jamrozik</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Evidence-poor medicine: just how evidence-based are Australian clinical practice guidelines?</article-title>
          <source>Intern Med J</source>
          <year>2020</year>
          <month>01</month>
          <day>14</day>
          <volume>50</volume>
          <issue>1</issue>
          <fpage>30</fpage>
          <lpage>37</lpage>
          <pub-id pub-id-type="doi">10.1111/imj.14466</pub-id>
          <pub-id pub-id-type="medline">31943616</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lanera</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Berchialla</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Minto</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gregori</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Baldi</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Screening PubMed abstracts: is class imbalance always a challenge to machine learning?</article-title>
          <source>Syst Rev</source>
          <year>2019</year>
          <month>12</month>
          <day>06</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>317</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://systematicreviewsjournal.biomedcentral.com/articles/10.1186/s13643-019-1245-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13643-019-1245-8</pub-id>
          <pub-id pub-id-type="medline">31810495</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13643-019-1245-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC6896747</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fernández-Delgado</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cernadas</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Barro</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Amorim</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Do we need hundreds of classifiers to solve real world classification problems?</article-title>
          <source>J Mach Learn Res</source>
          <year>2014</year>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>3181</fpage>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bekkar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Djema</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Alitouche</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Evaluation measures for models assessment over imbalanced data sets</article-title>
          <source>J Inf Engineer Applic</source>
          <year>2013</year>
          <volume>3</volume>
          <fpage>27</fpage>
          <lpage>38</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://core.ac.uk/download/pdf/234677037.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>YQ</given-names>
            </name>
            <name name-style="western">
              <surname>Chawla</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Krasser</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>SVMs modeling for highly imbalanced classification</article-title>
          <source>IEEE Trans Syst Man Cybern B</source>
          <year>2009</year>
          <month>02</month>
          <volume>39</volume>
          <issue>1</issue>
          <fpage>281</fpage>
          <lpage>288</lpage>
          <pub-id pub-id-type="doi">10.1109/tsmcb.2008.2002909</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Mara-Eves</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>McNaught</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Miwa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ananiadou</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Using text mining for study identification in systematic reviews: a systematic review of current approaches</article-title>
          <source>Syst Rev</source>
          <year>2015</year>
          <month>01</month>
          <day>14</day>
          <volume>4</volume>
          <fpage>5</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://systematicreviewsjournal.biomedcentral.com/articles/10.1186/2046-4053-4-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/2046-4053-4-5</pub-id>
          <pub-id pub-id-type="medline">25588314</pub-id>
          <pub-id pub-id-type="pii">2046-4053-4-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC4320539</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shakeel</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Krüger</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nostitz-Wallwitz</surname>
              <given-names>IV</given-names>
            </name>
            <name name-style="western">
              <surname>Saake</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Leich</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Automated selection and quality assessment of primary studies</article-title>
          <source>J Data Inf Qual</source>
          <year>2020</year>
          <month>01</month>
          <day>23</day>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.1145/3356901</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yoo</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>A coherent graph-based semantic clustering and summarization approach for biomedical literature and a new summarization evaluation method</article-title>
          <source>BMC Bioinformatics</source>
          <year>2007</year>
          <month>11</month>
          <day>27</day>
          <volume>8 Suppl 9</volume>
          <fpage>S4</fpage>
          <pub-id pub-id-type="doi">10.1186/1471-2105-8-S9-S4</pub-id>
          <pub-id pub-id-type="medline">18047705</pub-id>
          <pub-id pub-id-type="pii">1471-2105-8-S9-S4</pub-id>
          <pub-id pub-id-type="pmcid">PMC2217662</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arguello Casteleiro</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Maseda Fernandez</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Demetriou</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Read</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Fernandez Prieto</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Des Diz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nenadic</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Keane</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stevens</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>A case study on sepsis using PubMed and deep learning for ontology learning</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2017</year>
          <volume>235</volume>
          <fpage>516</fpage>
          <lpage>520</lpage>
          <pub-id pub-id-type="medline">28423846</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="web">
          <source>EQUATOR Network: Reporting Guidelines</source>
          <access-date>2021-08-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.equator-network.org/reporting-guidelines/">https://www.equator-network.org/reporting-guidelines/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rivera</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Denniston</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Calvert</surname>
              <given-names>MJ</given-names>
            </name>
            <collab>SPIRIT-AI and CONSORT-AI Working Group</collab>
          </person-group>
          <article-title>Guidelines for clinical trial protocols for interventions involving artificial intelligence: the SPIRIT-AI Extension</article-title>
          <source>BMJ</source>
          <year>2020</year>
          <month>09</month>
          <day>09</day>
          <volume>370</volume>
          <fpage>m3210</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/lookup/pmidlookup?view=long&#38;pmid=32907797"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.m3210</pub-id>
          <pub-id pub-id-type="medline">32907797</pub-id>
          <pub-id pub-id-type="pmcid">PMC7490785</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Watson</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Krutzinna</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bruce</surname>
              <given-names>IN</given-names>
            </name>
            <name name-style="western">
              <surname>Griffiths</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>McInnes</surname>
              <given-names>IB</given-names>
            </name>
            <name name-style="western">
              <surname>Barnes</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Floridi</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Clinical applications of machine learning algorithms: beyond the black box</article-title>
          <source>BMJ</source>
          <year>2019</year>
          <month>03</month>
          <day>12</day>
          <volume>364</volume>
          <fpage>l886</fpage>
          <pub-id pub-id-type="doi">10.1136/bmj.l886</pub-id>
          <pub-id pub-id-type="medline">30862612</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ramsundar</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Feinberg</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gomes</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Geniesse</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pappu</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Leswing</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pande</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>MoleculeNet: a benchmark for molecular machine learning</article-title>
          <source>Chem Sci</source>
          <year>2018</year>
          <month>01</month>
          <day>14</day>
          <volume>9</volume>
          <issue>2</issue>
          <fpage>513</fpage>
          <lpage>530</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1039/c7sc02664a"/>
          </comment>
          <pub-id pub-id-type="doi">10.1039/c7sc02664a</pub-id>
          <pub-id pub-id-type="medline">29629118</pub-id>
          <pub-id pub-id-type="pii">c7sc02664a</pub-id>
          <pub-id pub-id-type="pmcid">PMC5868307</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>BERT: pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>ArXiv.</source>
          <comment>Preprint posted online on October 10, 2018.
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1810.04805"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yoon</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>So</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>BioBERT: a pre-trained biomedical language representation model for biomedical text mining</article-title>
          <source>Bioinformatics</source>
          <year>2020</year>
          <month>02</month>
          <day>15</day>
          <volume>36</volume>
          <issue>4</issue>
          <fpage>1234</fpage>
          <lpage>1240</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31501885"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btz682</pub-id>
          <pub-id pub-id-type="medline">31501885</pub-id>
          <pub-id pub-id-type="pii">5566506</pub-id>
          <pub-id pub-id-type="pmcid">PMC7703786</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
