<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">ResProt</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Res Protoc</journal-id>
      <journal-title>JMIR Research Protocols</journal-title>
      <issn pub-type="epub">1929-0748</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v10i11e29398</article-id>
      <article-id pub-id-type="pmid">34847061</article-id>
      <article-id pub-id-type="doi">10.2196/29398</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Protocol</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Protocol</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A Deep Learning Approach to Refine the Identification of High-Quality Clinical Research Articles From the Biomedical Literature: Protocol for Algorithm Development and Validation</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Michelson</surname>
            <given-names>Matthew</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Berchialla</surname>
            <given-names>Paola</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Thompson</surname>
            <given-names>Alison</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Abdelkader</surname>
            <given-names>Wael</given-names>
          </name>
          <degrees>MSc, MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9581-1521</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Navarro</surname>
            <given-names>Tamara</given-names>
          </name>
          <degrees>MLiS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2810-6942</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Parrish</surname>
            <given-names>Rick</given-names>
          </name>
          <degrees>Dip T</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3809-6015</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Cotoi</surname>
            <given-names>Chris</given-names>
          </name>
          <degrees>BEng, EMBA</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7029-0582</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Germini</surname>
            <given-names>Federico</given-names>
          </name>
          <degrees>MSc, MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0802-3616</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Linkins</surname>
            <given-names>Lori-Ann</given-names>
          </name>
          <degrees>MSc, MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9308-173X</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Iorio</surname>
            <given-names>Alfonso</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3331-8766</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Haynes</surname>
            <given-names>R Brian</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1453-3196</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Ananiadou</surname>
            <given-names>Sophia</given-names>
          </name>
          <degrees>BA, DEA, PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4097-9191</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Chu</surname>
            <given-names>Lingyang</given-names>
          </name>
          <degrees>BSc, PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8937-1750</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Lokker</surname>
            <given-names>Cynthia</given-names>
          </name>
          <degrees>MSc, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Health Information Research Unit</institution>
            <institution>Department of Health Research Methods, Evidence, and Impact</institution>
            <institution>McMaster University</institution>
            <addr-line>1280 Main St W, CRL-137</addr-line>
            <addr-line>Hamilton, ON, L8S 4K1</addr-line>
            <country>Canada</country>
            <phone>1 9055259140 ext 22208</phone>
            <email>lokkerc@mcmaster.ca</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2436-4290</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Health Information Research Unit</institution>
        <institution>Department of Health Research Methods, Evidence, and Impact</institution>
        <institution>McMaster University</institution>
        <addr-line>Hamilton, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Medicine</institution>
        <institution>McMaster University</institution>
        <addr-line>Hamilton, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Computer Science</institution>
        <institution>University of Manchester</institution>
        <addr-line>Manchester</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>The Alan Turing Institute</institution>
        <addr-line>London</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Computing and Software</institution>
        <institution>Faculty of Engineering</institution>
        <institution>McMaster University</institution>
        <addr-line>Hamilton, ON</addr-line>
        <country>Canada</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Cynthia Lokker <email>lokkerc@mcmaster.ca</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>11</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>29</day>
        <month>11</month>
        <year>2021</year>
      </pub-date>
      <volume>10</volume>
      <issue>11</issue>
      <elocation-id>e29398</elocation-id>
      <history>
        <date date-type="received">
          <day>7</day>
          <month>4</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>25</day>
          <month>5</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>24</day>
          <month>8</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>17</day>
          <month>9</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Wael Abdelkader, Tamara Navarro, Rick Parrish, Chris Cotoi, Federico Germini, Lori-Ann Linkins, Alfonso Iorio, R Brian Haynes, Sophia Ananiadou, Lingyang Chu, Cynthia Lokker. Originally published in JMIR Research Protocols (https://www.researchprotocols.org), 29.11.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Research Protocols, is properly cited. The complete bibliographic information, a link to the original publication on https://www.researchprotocols.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.researchprotocols.org/2021/11/e29398" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>A barrier to practicing evidence-based medicine is the rapidly increasing body of biomedical literature. Use of method terms to limit the search can help reduce the burden of screening articles for clinical relevance; however, such terms are limited by their partial dependence on indexing terms and usually produce low precision, especially when high sensitivity is required. Machine learning has been applied to the identification of high-quality literature with the potential to achieve high precision without sacrificing sensitivity. The use of artificial intelligence has shown promise to improve the efficiency of identifying sound evidence.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The primary objective of this research is to derive and validate deep learning machine models using iterations of Bidirectional Encoder Representations from Transformers (BERT) to retrieve high-quality, high-relevance evidence for clinical consideration from the biomedical literature.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Using the HuggingFace Transformers library, we will experiment with variations of BERT models, including BERT, BioBERT, BlueBERT, and PubMedBERT, to determine which have the best performance in article identification based on quality criteria. Our experiments will utilize a large data set of over 150,000 PubMed citations from 2012 to 2020 that have been manually labeled based on their methodological rigor for clinical use. We will evaluate and report on the performance of the classifiers in categorizing articles based on their likelihood of meeting quality criteria. We will report fine-tuning hyperparameters for each model, as well as their performance metrics, including recall (sensitivity), specificity, precision, accuracy, F-score, the number of articles that need to be read before finding one that is positive (meets criteria), and classification probability scores.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Initial model development is underway, with further development planned for early 2022. Performance testing is expected to star in February 2022. Results will be published in 2022.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The experiments will aim to improve the precision of retrieving high-quality articles by applying a machine learning classifier to PubMed searching.</p>
        </sec>
        <sec sec-type="registered-report">
          <title>International Registered Report Identifier (IRRID)</title>
          <p>DERR1-10.2196/29398</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>bioinformatics</kwd>
        <kwd>machine learning</kwd>
        <kwd>evidence-based medicine</kwd>
        <kwd>literature retrieval</kwd>
        <kwd>medical informatics</kwd>
        <kwd>natural language processing</kwd>
        <kwd>NLP</kwd>
        <kwd>biomedical</kwd>
        <kwd>literature</kwd>
        <kwd>literature surveillance</kwd>
        <kwd>model development</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>The biomedical literature grows exponentially every year. According to the latest National Library of Medicine statistical report, more than 1.5 million new citations were indexed in PubMed in 2020 alone [<xref ref-type="bibr" rid="ref1">1</xref>]. This high volume of literature is fed by the publication of at least 1 new article every 26 seconds [<xref ref-type="bibr" rid="ref2">2</xref>] and 95 clinical trials per day [<xref ref-type="bibr" rid="ref3">3</xref>]. Nevertheless, only 1% of published clinical studies meet the criteria for high scientific quality for use in health care decisions [<xref ref-type="bibr" rid="ref4">4</xref>], driving the need for efficient and accurate approaches to identify clinical studies that have been conducted with methodological rigor.</p>
        <p>Methodological search filters like PubMed Clinical Queries [<xref ref-type="bibr" rid="ref5">5</xref>] are considered the cornerstone for information retrieval in evidence-based practice [<xref ref-type="bibr" rid="ref6">6</xref>]. These and other search filters have been developed using a diagnostic testing procedure [<xref ref-type="bibr" rid="ref7">7</xref>] to optimize sensitivity or specificity, or the best balance between the two, for such clinical study categories as treatment, diagnosis, prognosis, etiology, and clinical prediction guides [<xref ref-type="bibr" rid="ref8">8</xref>]. Some search filters are limited by their partial reliance on MeSH (Medical Subject Headings) indexing terms, as it can take up to a year for articles to be indexed in MEDLINE [<xref ref-type="bibr" rid="ref9">9</xref>]. Despite having highly sensitive search filters, with an aim to optimize specificity—essentially returning the most likely relevant articles while reducing the need to assess off-target articles—they also return large numbers of articles that are not on target.</p>
        <p>Most search filters have been developed using databases of articles that have been tagged for clinical category and methodological rigor and using a diagnostic test approach to detect true and false, positive (on-target) and negative (off-target) articles [<xref ref-type="bibr" rid="ref10">10</xref>]. The development of such a gold standard is costly and time-consuming, requiring highly trained staff. The Clinical Hedges database, developed at McMaster University, has been used as the gold standard for new search strategy development [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref14">14</xref>].</p>
        <p>Machine learning is a subset of artificial intelligence referring to the application of computational methods to improve performance or achieve precise predictions via experience. Experience, in this context, is the information given to the machine for analysis [<xref ref-type="bibr" rid="ref15">15</xref>]. Machine learning applications in the biomedical literature have been explored by many researchers over the years. In 2007, Yoo and colleagues [<xref ref-type="bibr" rid="ref16">16</xref>] applied a novel machine learning approach for document clustering and text summarization, producing a textual summary of the information by automatically extracting the most relevant text content from a document cluster. Machine learning has also been applied to the ranking of biomedical publications. In 2009, the MedlineRanker webserver ranked citations in a data set based on their relevance to a given topic [<xref ref-type="bibr" rid="ref17">17</xref>]. Other applications of machine learning include accurately predicting the citation count of a given article at the time of its publication to determine its scientific impact using a support vector machine (SVM) context–based classifier [<xref ref-type="bibr" rid="ref18">18</xref>] and automating the systematic review screening process to decrease the screening workload [<xref ref-type="bibr" rid="ref19">19</xref>]. For example, Miwa and colleagues [<xref ref-type="bibr" rid="ref20">20</xref>] used an SVM pool–based active machine learning model to classify articles as relevant for inclusion in a systematic review. Miwa et al's [<xref ref-type="bibr" rid="ref20">20</xref>] experiment used “certainty” as a criterion for article selection, which is effective in dealing with imbalanced data sets. An improvement in topic detection was proposed by Hashimoto et al [<xref ref-type="bibr" rid="ref21">21</xref>] as they used a neural network model based on paragraph vectors capturing semantic similarities between words and documents. Paragraph vectors can accurately determine semantic relatedness between textual units of varying lengths, that is, words, phrases, and longer sequences (eg, sentences, paragraphs, and documents). Methods that consider factors such as word order within the text yield superior performance [<xref ref-type="bibr" rid="ref21">21</xref>].</p>
        <p>Recent advancement in natural language processing (NLP) is attributed to the development of pretrained language models (PTLMs) [<xref ref-type="bibr" rid="ref22">22</xref>]. PTLMs transfer learning from training on one data set to the performance of different NLP functions on a new data set [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. PTLMs provide more stable predictions and better model generalization [<xref ref-type="bibr" rid="ref24">24</xref>]. PTLMs are applied using one of two main strategies: feature-based or fine-tuning models [<xref ref-type="bibr" rid="ref23">23</xref>]. Feature-based approaches use task-specific architectures that include the pretrained representations as additional features, such as Embedding from Language Models (ELMo) [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. Fine-tuning approaches attempt to pretrain the language model using general-domain text, then fine-tune the model on the target data and target task [<xref ref-type="bibr" rid="ref22">22</xref>]. Fine-tuning language models are considered the mainstream for PTLM adaption [<xref ref-type="bibr" rid="ref22">22</xref>]. Examples of fine-tuning approaches are Universal Language Model Fine-Tuning [<xref ref-type="bibr" rid="ref26">26</xref>] and Bidirectional Encoder Representations from Transformers (BERT) [<xref ref-type="bibr" rid="ref23">23</xref>]. The bidirectional approach used in BERT improves its performance in understanding text context over other PTLMs, making it the state-of-the-art model. BERT can be used for multiple NLP tasks, including text summarization, retrieval, question answers, named entity recognition, and document classification [<xref ref-type="bibr" rid="ref27">27</xref>].</p>
        <p>Over the past two decades, machine learning has been applied to classify the biomedical literature based on methodological rigor and evidence quality. For such classification tasks, supervised machine learning approaches in which the training data is labeled based on a selected high-quality standard are most commonly used [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref28">28</xref>-<xref ref-type="bibr" rid="ref32">32</xref>]. The first reported experiments to classify biomedical literature based on quality by Aphinyanaphongs and colleagues relied on the American College of Physicians Journal Club as their high-quality training standard and used a supervised SVM as a classifier [<xref ref-type="bibr" rid="ref28">28</xref>-<xref ref-type="bibr" rid="ref30">30</xref>]. The most recent study to classify high-quality articles was conducted by Afzal and colleagues [<xref ref-type="bibr" rid="ref31">31</xref>] and applied an artificial neural network using data gathered from the Cochrane Library as their high-quality standard. By using supervised approaches, the model development was informed by decisions made by the researchers.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>The primary objective of this research is to derive and validate deep learning models using variations of BERT to retrieve high-quality, high-relevance evidence for clinical consideration from the biomedical literature; models will be trained using a large, tagged database of high-quality, high-relevance clinical articles.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Quality Standard Derivation</title>
        <p>At McMaster University, the Health Information Research Unit (HiRU) has an established reputation for retrieval, appraisal, classification, organization, and dissemination of health-related research. Through the Knowledge Refinery, the unit daily screens research studies from over 120 clinical journals and identifies those that meet methodological rigor for original studies, systematic reviews, pooled original studies, and evidence-based guidelines within the categories of treatment, primary prevention, diagnosis, harm from medical interventions, economics, prognosis, clinical prediction, and quality improvement [<xref ref-type="bibr" rid="ref33">33</xref>]. The steps in the process include the initial filtering of all journal articles using highly sensitive search filters (&#62;99%) developed by HiRU to identify articles that fit the categories named above. This filtered subset is then manually reviewed by skilled research associates and a clinical editor. In this project, “rigor” is defined as meeting all the methodological criteria explicitly described on the HiRU website and in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> [<xref ref-type="bibr" rid="ref34">34</xref>]. The process of selecting clinically relevant articles is further described by Haynes et al [<xref ref-type="bibr" rid="ref35">35</xref>], and the high reliability of the critical appraisal step has been documented with a kappa value of over 80% for all categories of articles [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
        <p>The Premium Literature Service (PLUS) process is based on scientific principles for critical appraisal of the medical literature to support evidence-based medicine, combined with multiple ratings of clinical relevance by a worldwide network of practicing health care professionals. Segments of the database have been used many times to test various machine learning approaches, including deep learning [<xref ref-type="bibr" rid="ref3">3</xref>]. A vast community of &#62;4000 clinicians then rate methodologically rigorous articles for clinical relevance and newsworthiness [<xref ref-type="bibr" rid="ref37">37</xref>]. The resulting PLUS database contains a distillation of the most reliable and relevant published clinical research [<xref ref-type="bibr" rid="ref38">38</xref>].</p>
      </sec>
      <sec>
        <title>Data Set</title>
        <p>The data used is the Critical Appraisal Process (CAP) data set, which consists of the titles and abstracts of 155,679 articles published between 2012 to 2020, identified by means of their PubMed identifier and manually labeled by research associates as those that “fulfilled” methodological rigor criteria (n=30,035) or “failed” to meet methodological rigor criteria (n=125,644). The data set will be randomly split into 80% for training, 10% for validation, and 10% for testing. Along with being unbalanced, the CAP data set is large and computationally challenging for deep learning model development. To overcome this limitation, we will first convert the data set into multiple balanced subsets, then independently train one model per each of the balanced subsets and use ensembling techniques [<xref ref-type="bibr" rid="ref39">39</xref>-<xref ref-type="bibr" rid="ref42">42</xref>] to combine the independently trained models into a better model with more robust performance.</p>
      </sec>
      <sec>
        <title>Machine Learning Experiment</title>
        <p>Using Python (Python Software Foundation), we will build our models using the HuggingFace Transformers library [<xref ref-type="bibr" rid="ref43">43</xref>]. HuggingFace is an open-source NLP and artificial intelligence model hub that provides accessible and implementable state-of-the-art models to the community [<xref ref-type="bibr" rid="ref44">44</xref>]. Using PTLMs available within the HuggingFace Transformers library, we will experiment with variations of BERT models to determine which have the best performance in article classification. These will include BERT [<xref ref-type="bibr" rid="ref23">23</xref>], BioBERT [<xref ref-type="bibr" rid="ref45">45</xref>], BlueBERT [<xref ref-type="bibr" rid="ref46">46</xref>], and PubMedBERT [<xref ref-type="bibr" rid="ref47">47</xref>]. These models differ in the pretraining text domain. Pretraining a biomedical BERT model follows a mixed-domain pretraining that initializes with standard BERT pretraining using text data from BookCorpus [<xref ref-type="bibr" rid="ref48">48</xref>] and English Wikipedia (Wikimedia Foundation) [<xref ref-type="bibr" rid="ref23">23</xref>], followed by continuous pretraining using biomedical text. BioBERT is pretrained using PubMed abstracts and PubMed Central full-text articles [<xref ref-type="bibr" rid="ref45">45</xref>], while BlueBERT is pretrained using PubMed text and clinical notes from MIMIC-III (Medical Information Mart for Intensive Care) [<xref ref-type="bibr" rid="ref46">46</xref>]. PubMedBERT is pretrained using domain-specific text data from a collection of 14 million PubMed abstracts, which were downloaded in February 2020, with abstracts under 128 words removed [<xref ref-type="bibr" rid="ref47">47</xref>]. Our selection of these models was guided by their availability within the HuggingFace repository and their reported performance in the Biomedical Language Understanding and Reasoning Benchmark leaderboard [<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref49">49</xref>].</p>
        <p>For the top-performing model that maintains sensitivity &#62;98%, we plan to prospectively validate its real-world performance in the McMaster PLUS reading process. A random sample of incoming articles that are classified as failed articles will be allocated to research staff blinded to the model determination.</p>
        <p>To evaluate the performance of machine learning models, we will report the sensitivity (recall), specificity, accuracy, precision, the number of articles that need to be read before finding one that is positive, and F-score (harmonic mean of recall and precision metrics [<xref ref-type="bibr" rid="ref50">50</xref>]) (<xref ref-type="table" rid="table1">Table 1</xref>). We will report the probability score threshold, with corresponding 95% CIs, for each model. The machine learning models return a probability score for each article that represents the probability that the article is of high quality, and ranges from 0 (does not meet criteria) to 1 (meets criteria). For a given article, the probability will vary depending on the composition of the model. To prospectively validate the performance of the best model, we will report the same diagnostic characteristics for prospective validation of the model. Fine-tuning hyperparameter settings (number of epochs, learning rate, batch size, and number of random seeds) of the selected models for validation will be reported.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Definitions and formulas pertaining to performance metrics.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="200"/>
            <col width="520"/>
            <col width="280"/>
            <thead>
              <tr valign="top">
                <td>Measure</td>
                <td>Definition</td>
                <td>Formula</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Recall (sensitivity)</td>
                <td>The proportion of correctly identified positive articles fulfilling criteria among those predicted to be positive</td>
                <td>TP<sup>a</sup>/(TP+FN<sup>b</sup>)</td>
              </tr>
              <tr valign="top">
                <td>Specificity</td>
                <td>The proportion of articles correctly identified as not meeting criteria among those predicted as negative</td>
                <td>TN<sup>c</sup>/(TN+FP<sup>d</sup>)</td>
              </tr>
              <tr valign="top">
                <td>Precision</td>
                <td>The proportion of correctly identified positives among all classified positives</td>
                <td>TP/(TP+FP)</td>
              </tr>
              <tr valign="top">
                <td>F-measure</td>
                <td>Harmonic mean of precision and recall</td>
                <td>2 × ([precision × recall]/[precision + recall])</td>
              </tr>
              <tr valign="top">
                <td>Accuracy</td>
                <td>The number of correctly predicted documents out of all classified documents</td>
                <td>(TP+TN)/(TP+FP+FN+TN)</td>
              </tr>
              <tr valign="top">
                <td>Number needed to read</td>
                <td>The number of articles that need to be read before finding one that is positive (meets criteria)</td>
                <td>1/precision</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>TP: true positive.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>FN: false negative.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>TN: true negative.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>FP: false positive.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>Initial model development is underway, with further development planned for early 2022. Performance testing is expected to start in February 2022. Results will be published in 2022.</p>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>BERT is considered the state-of-the-art model for NLP. To our knowledge, this is the first experiment to investigate the use of PTLMs in the identification of high-quality articles from the biomedical literature [<xref ref-type="bibr" rid="ref51">51</xref>]. Our study leverages a large data set of over 150,000 citations that have been manually tagged by experienced research associates, making it one of the few reliable sources for training machine learning models to identify high-quality clinical literature [<xref ref-type="bibr" rid="ref50">50</xref>]. Our application and analysis of BERT models may provide a better performing automation model suitable for incorporation in literature surveillance processes at HiRU and elsewhere.</p>
      <p>Artificial intelligence and machine learning applications are complex and known for their black-box nature, providing predictions without enough explanation [<xref ref-type="bibr" rid="ref52">52</xref>]. Besides the accurate prediction and the decrease in workload, trust in algorithmic decisions is essential, especially in medicine and health care research [<xref ref-type="bibr" rid="ref53">53</xref>]. To overcome the lack of transparency, interpreting machine learning models and their decision-making process has become a growing focus among academic and industrial machine learning experts [<xref ref-type="bibr" rid="ref54">54</xref>]. Next steps include interpreting the decisions made by the model. This would allow us to understand the justification behind model decision-making [<xref ref-type="bibr" rid="ref55">55</xref>].</p>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Inclusion criteria for articles meeting methodological rigor.</p>
        <media xlink:href="resprot_v10i11e29398_app1.docx" xlink:title="DOCX File , 24 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">BERT</term>
          <def>
            <p>Bidirectional Encoder Representations from Transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CAP</term>
          <def>
            <p>Critical Appraisal Process</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">HiRU</term>
          <def>
            <p>Health Information Research Unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">MeSH</term>
          <def>
            <p>Medical Subject Headings</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">MIMIC-III</term>
          <def>
            <p>Medical Information Mart for Intensive Care</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">PLUS</term>
          <def>
            <p>Premium Literature Service</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">PTLM</term>
          <def>
            <p>pretrained language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">SVM</term>
          <def>
            <p>support vector machine</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <article-title>MEDLINE PubMed Production Statistics</article-title>
          <source>National Library of Medicine</source>
          <year>2020</year>
          <access-date>2021-07-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nlm.nih.gov/bsd/medline_pubmed_production_stats.html">https://www.nlm.nih.gov/bsd/medline_pubmed_production_stats.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Garba</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Makama</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Odigie</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Proliferations of scientific medical journals: a burden or a blessing</article-title>
          <source>Oman Med J</source>
          <year>2010</year>
          <month>10</month>
          <volume>25</volume>
          <issue>4</issue>
          <fpage>311</fpage>
          <lpage>4</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22043365"/>
          </comment>
          <pub-id pub-id-type="doi">10.5001/omj.2010.89</pub-id>
          <pub-id pub-id-type="medline">22043365</pub-id>
          <pub-id pub-id-type="pii">OMJ-D-10-00052</pub-id>
          <pub-id pub-id-type="pmcid">PMC3191655</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Del Fiol</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Michelson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Iorio</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cotoi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
          </person-group>
          <article-title>A Deep Learning Method to Automatically Identify Reports of Scientifically Rigorous Clinical Research from the Biomedical Literature: Comparative Analytic Study</article-title>
          <source>J Med Internet Res</source>
          <year>2018</year>
          <month>06</month>
          <day>25</day>
          <volume>20</volume>
          <issue>6</issue>
          <fpage>e10281</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2018/6/e10281/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/10281</pub-id>
          <pub-id pub-id-type="medline">29941415</pub-id>
          <pub-id pub-id-type="pii">v20i6e10281</pub-id>
          <pub-id pub-id-type="pmcid">PMC6037944</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Where's the meat in clinical journals?</article-title>
          <source>ACP Journal Club</source>
          <year>1993</year>
          <volume>119</volume>
          <issue>3</issue>
          <fpage>A22</fpage>
          <pub-id pub-id-type="doi">10.7326/ACPJC-1993-119-3-A22</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wilczynski</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>McKibbon</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Walter</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Garg</surname>
              <given-names>AX</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
          </person-group>
          <article-title>MEDLINE clinical queries are robust when searching in recent publishing years</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2013</year>
          <volume>20</volume>
          <issue>2</issue>
          <fpage>363</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23019242"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2012-001075</pub-id>
          <pub-id pub-id-type="medline">23019242</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2012-001075</pub-id>
          <pub-id pub-id-type="pmcid">PMC3638187</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bachmann</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Coray</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Estermann</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ter Riet</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Identifying diagnostic studies in MEDLINE: reducing the number needed to read</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2002</year>
          <volume>9</volume>
          <issue>6</issue>
          <fpage>653</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/12386115"/>
          </comment>
          <pub-id pub-id-type="doi">10.1197/jamia.m1124</pub-id>
          <pub-id pub-id-type="medline">12386115</pub-id>
          <pub-id pub-id-type="pmcid">PMC349381</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wilczynski</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Morgan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
            <collab>Hedges Team</collab>
          </person-group>
          <article-title>An overview of the design and methods for retrieving high-quality studies for clinical care</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2005</year>
          <month>06</month>
          <day>21</day>
          <volume>5</volume>
          <fpage>20</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/1472-6947-5-20"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1472-6947-5-20</pub-id>
          <pub-id pub-id-type="medline">15969765</pub-id>
          <pub-id pub-id-type="pii">1472-6947-5-20</pub-id>
          <pub-id pub-id-type="pmcid">PMC1183213</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
          <article-title>Hedges</article-title>
          <source>Health Information Research Unit - McMaster University</source>
          <year>2016</year>
          <access-date>2021-11-18</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://hiru.mcmaster.ca/hiru/HIRU_Hedges_home.aspx">https://hiru.mcmaster.ca/hiru/HIRU_Hedges_home.aspx</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Irwin</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Rackham</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Comparison of the time-to-indexing in PubMed between biomedical journals according to impact factor, discipline, and focus</article-title>
          <source>Res Social Adm Pharm</source>
          <year>2017</year>
          <volume>13</volume>
          <issue>2</issue>
          <fpage>389</fpage>
          <lpage>393</lpage>
          <pub-id pub-id-type="doi">10.1016/j.sapharm.2016.04.006</pub-id>
          <pub-id pub-id-type="medline">27215603</pub-id>
          <pub-id pub-id-type="pii">S1551-7411(16)30019-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Wilczynski</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Ramkissoonsingh</surname>
              <given-names>R</given-names>
            </name>
            <collab>Hedges Team</collab>
          </person-group>
          <article-title>Developing optimal search strategies for detecting sound clinical prediction studies in MEDLINE</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2003</year>
          <fpage>728</fpage>
          <lpage>32</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/14728269"/>
          </comment>
          <pub-id pub-id-type="medline">14728269</pub-id>
          <pub-id pub-id-type="pii">D030003013</pub-id>
          <pub-id pub-id-type="pmcid">PMC1479983</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Geersing</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bouwmeester</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zuithoff</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Spijker</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Leeflang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moons</surname>
              <given-names>KGM</given-names>
            </name>
            <name name-style="western">
              <surname>Moons</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Search filters for finding prognostic and diagnostic prediction studies in Medline to enhance systematic reviews</article-title>
          <source>PLoS One</source>
          <year>2012</year>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>e32844</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0032844"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0032844</pub-id>
          <pub-id pub-id-type="medline">22393453</pub-id>
          <pub-id pub-id-type="pii">PONE-D-11-19528</pub-id>
          <pub-id pub-id-type="pmcid">PMC3290602</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Frazier</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Stein</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Tseytlin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bekhuis</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Building a gold standard to construct search filters: a case study with biomarkers for oral cancer</article-title>
          <source>J Med Libr Assoc</source>
          <year>2015</year>
          <month>01</month>
          <volume>103</volume>
          <issue>1</issue>
          <fpage>22</fpage>
          <lpage>30</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25552941"/>
          </comment>
          <pub-id pub-id-type="doi">10.3163/1536-5050.103.1.005</pub-id>
          <pub-id pub-id-type="medline">25552941</pub-id>
          <pub-id pub-id-type="pii">JMLA-D-14-00011</pub-id>
          <pub-id pub-id-type="pmcid">PMC4279929</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Keogh</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>O'Brien</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Teljeur</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>McGrath</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Doherty</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dimitrov</surname>
              <given-names>BD</given-names>
            </name>
            <name name-style="western">
              <surname>Fahey</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Optimized retrieval of primary care clinical prediction rules from MEDLINE to establish a Web-based register</article-title>
          <source>J Clin Epidemiol</source>
          <year>2011</year>
          <month>08</month>
          <volume>64</volume>
          <issue>8</issue>
          <fpage>848</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2010.11.011</pub-id>
          <pub-id pub-id-type="medline">21411285</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(10)00423-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Dobbins</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Decorby</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>McRae</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tirilis</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Husson</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>An optimal search filter for retrieving systematic reviews and meta-analyses</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2012</year>
          <month>04</month>
          <day>18</day>
          <volume>12</volume>
          <fpage>51</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/1471-2288-12-51"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2288-12-51</pub-id>
          <pub-id pub-id-type="medline">22512835</pub-id>
          <pub-id pub-id-type="pii">1471-2288-12-51</pub-id>
          <pub-id pub-id-type="pmcid">PMC3515398</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mohri</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rostamizadeh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Talwalkar</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>Foundations of Machine Learning, 2nd ed</source>
          <year>2018</year>
          <publisher-loc>Cambridge, MA</publisher-loc>
          <publisher-name>MIT Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yoo</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>A coherent graph-based semantic clustering and summarization approach for biomedical literature and a new summarization evaluation method</article-title>
          <source>BMC Bioinformatics</source>
          <year>2007</year>
          <month>11</month>
          <day>27</day>
          <volume>8 Suppl 9</volume>
          <fpage>S4</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-8-S9-S4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2105-8-S9-S4</pub-id>
          <pub-id pub-id-type="medline">18047705</pub-id>
          <pub-id pub-id-type="pii">1471-2105-8-S9-S4</pub-id>
          <pub-id pub-id-type="pmcid">PMC2217662</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fontaine</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Barbosa-Silva</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schaefer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Huska</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Muro</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Andrade-Navarro</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>MedlineRanker: flexible ranking of biomedical literature</article-title>
          <source>Nucleic Acids Res</source>
          <year>2009</year>
          <month>07</month>
          <volume>37</volume>
          <issue>Web Server issue</issue>
          <fpage>W141</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/19429696"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkp353</pub-id>
          <pub-id pub-id-type="medline">19429696</pub-id>
          <pub-id pub-id-type="pii">gkp353</pub-id>
          <pub-id pub-id-type="pmcid">PMC2703945</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>LD</given-names>
            </name>
            <name name-style="western">
              <surname>Aliferis</surname>
              <given-names>CF</given-names>
            </name>
          </person-group>
          <article-title>Using content-based and bibliometric features for machine learning models to predict citation counts in the biomedical literature</article-title>
          <source>Scientometrics</source>
          <year>2010</year>
          <month>2</month>
          <day>3</day>
          <volume>85</volume>
          <issue>1</issue>
          <fpage>257</fpage>
          <lpage>270</lpage>
          <pub-id pub-id-type="doi">10.1007/s11192-010-0160-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Mara-Eves</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>McNaught</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Miwa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ananiadou</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Using text mining for study identification in systematic reviews: a systematic review of current approaches</article-title>
          <source>Syst Rev</source>
          <year>2015</year>
          <month>01</month>
          <day>14</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>5</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://systematicreviewsjournal.biomedcentral.com/articles/10.1186/2046-4053-4-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/2046-4053-4-5</pub-id>
          <pub-id pub-id-type="medline">25588314</pub-id>
          <pub-id pub-id-type="pii">2046-4053-4-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC4320539</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Miwa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>O'Mara-Eves</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ananiadou</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Reducing systematic review workload through certainty-based screening</article-title>
          <source>J Biomed Inform</source>
          <year>2014</year>
          <month>10</month>
          <volume>51</volume>
          <fpage>242</fpage>
          <lpage>53</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(14)00143-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2014.06.005</pub-id>
          <pub-id pub-id-type="medline">24954015</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(14)00143-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC4199186</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hashimoto</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kontonatsios</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Miwa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ananiadou</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Topic detection using paragraph vectors to support active learning in systematic reviews</article-title>
          <source>J Biomed Inform</source>
          <year>2016</year>
          <month>08</month>
          <volume>62</volume>
          <fpage>59</fpage>
          <lpage>65</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(16)30044-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2016.06.001</pub-id>
          <pub-id pub-id-type="medline">27293211</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(16)30044-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC4981645</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Qiu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Pre-trained models for natural language processing: A survey</article-title>
          <source>Sci China Technol Sci</source>
          <year>2020</year>
          <month>09</month>
          <day>15</day>
          <volume>63</volume>
          <issue>10</issue>
          <fpage>1872</fpage>
          <lpage>1897</lpage>
          <pub-id pub-id-type="doi">10.1007/s11431-020-1647-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>M-W</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>BERT: Pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online Oct 1, 2018
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1810.04805"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>QV</given-names>
            </name>
          </person-group>
          <article-title>Semi-supervised Sequence Learning</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online Nov 4, 2015
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1511.01432"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Neumann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Iyyer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gardner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zettlemoyer</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Deep contextualized word representations</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online Feb 14, 2018
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1802.05365"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/n18-1202</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Howard</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ruder</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Universal Language Model Fine-tuning for Text Classification</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online Jan 18, 2018
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1801.06146"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/p18-1031</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adhikari</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ram</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>DocBERT: BERT for Document Classification</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online Apr 17, 2019
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1904.08398"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aphinyanaphongs</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Aliferis</surname>
              <given-names>CF</given-names>
            </name>
          </person-group>
          <article-title>Text categorization models for retrieval of high quality articles in internal medicine</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2003</year>
          <fpage>31</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/14728128"/>
          </comment>
          <pub-id pub-id-type="medline">14728128</pub-id>
          <pub-id pub-id-type="pii">D030003601</pub-id>
          <pub-id pub-id-type="pmcid">PMC1480096</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aphinyanaphongs</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Aliferis</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Prospective validation of text categorization filters for identifying high-quality, content-specific articles in MEDLINE</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2006</year>
          <fpage>6</fpage>
          <lpage>10</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/17238292"/>
          </comment>
          <pub-id pub-id-type="medline">17238292</pub-id>
          <pub-id pub-id-type="pii">86426</pub-id>
          <pub-id pub-id-type="pmcid">PMC1839419</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aphinyanaphongs</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tsamardinos</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Statnikov</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hardin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Aliferis</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Text categorization models for high-quality article retrieval in internal medicine</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2005</year>
          <volume>12</volume>
          <issue>2</issue>
          <fpage>207</fpage>
          <lpage>16</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/15561789"/>
          </comment>
          <pub-id pub-id-type="doi">10.1197/jamia.M1641</pub-id>
          <pub-id pub-id-type="medline">15561789</pub-id>
          <pub-id pub-id-type="pii">M1641</pub-id>
          <pub-id pub-id-type="pmcid">PMC551552</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Afzal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hussain</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Deep Learning Based Biomedical Literature Classification Using Criteria of Scientific Rigor</article-title>
          <source>Electronics</source>
          <year>2020</year>
          <month>08</month>
          <day>05</day>
          <volume>9</volume>
          <issue>8</issue>
          <fpage>1253</fpage>
          <pub-id pub-id-type="doi">10.3390/electronics9081253</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kilicoglu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Demner-Fushman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Rindflesch</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Wilczynski</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
          </person-group>
          <article-title>Towards automatic recognition of scientifically rigorous clinical research evidence</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2009</year>
          <volume>16</volume>
          <issue>1</issue>
          <fpage>25</fpage>
          <lpage>31</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18952929"/>
          </comment>
          <pub-id pub-id-type="doi">10.1197/jamia.M2996</pub-id>
          <pub-id pub-id-type="medline">18952929</pub-id>
          <pub-id pub-id-type="pii">M2996</pub-id>
          <pub-id pub-id-type="pmcid">PMC2605595</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <article-title>McMaster Health Knowledge Refinery</article-title>
          <source>Health Information Research Unit - McMaster University</source>
          <year>2016</year>
          <access-date>2021-05-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://hiru.mcmaster.ca/hiru/HIRU_McMaster_HKR.aspx">https://hiru.mcmaster.ca/hiru/HIRU_McMaster_HKR.aspx</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
          <article-title>Inclusion Criteria</article-title>
          <source>Health Information Research Unit - McMaster University</source>
          <year>2019</year>
          <access-date>2021-05-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://hiru.mcmaster.ca/hiru/InclusionCriteria.html">https://hiru.mcmaster.ca/hiru/InclusionCriteria.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Cotoi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Holland</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Walters</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wilczynski</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Jedraszewski</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>McKinlay</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Parrish</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>McKibbon</surname>
              <given-names>KA</given-names>
            </name>
            <collab>McMaster Premium Literature Service (PLUS) Project</collab>
          </person-group>
          <article-title>Second-order peer review of the medical literature for clinical practitioners</article-title>
          <source>JAMA</source>
          <year>2006</year>
          <month>04</month>
          <day>19</day>
          <volume>295</volume>
          <issue>15</issue>
          <fpage>1801</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.295.15.1801</pub-id>
          <pub-id pub-id-type="medline">16622142</pub-id>
          <pub-id pub-id-type="pii">295/15/1801</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wilczynski</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>McKibbon</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
          </person-group>
          <article-title>Assessment of methodologic search filters in MEDLINE</article-title>
          <source>Proc Annu Symp Comput Appl Med Care</source>
          <year>1993</year>
          <fpage>601</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/8130545"/>
          </comment>
          <pub-id pub-id-type="medline">8130545</pub-id>
          <pub-id pub-id-type="pmcid">PMC2850647</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="web">
          <article-title>McMaster Online Rating of Evidence (MORETM)</article-title>
          <source>McMaster Premium Literature Service (PLUS) Project, McMaster University</source>
          <year>2018</year>
          <access-date>2021-05-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://hiru.mcmaster.ca/more/">http://hiru.mcmaster.ca/more/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="web">
          <article-title>McMaster Premium LiteratUre Service (PLUS)</article-title>
          <source>Health Information Research Unit - McMaster University</source>
          <year>2016</year>
          <access-date>2021-05-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://hiru.mcmaster.ca/hiru/HIRU_McMaster_PLUS_projects.aspx">https://hiru.mcmaster.ca/hiru/HIRU_McMaster_PLUS_projects.aspx</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ganaie</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tanveer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Suganthan</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Ensemble deep learning: A review</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online Apr 6, 2021
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/2104.02395"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Araque</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Corcuera-Platas</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Sánchez-Rada</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Iglesias</surname>
              <given-names>CA</given-names>
            </name>
          </person-group>
          <article-title>Enhancing deep learning sentiment analysis with ensemble techniques in social applications</article-title>
          <source>Expert Systems with Applications</source>
          <year>2017</year>
          <month>07</month>
          <volume>77</volume>
          <fpage>236</fpage>
          <lpage>246</lpage>
          <pub-id pub-id-type="doi">10.1016/j.eswa.2017.02.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Qiu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Improving BERT Fine-Tuning via Self-Ensemble and Self-Distillation</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online Feb 24, 2020
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/2002.10345"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Barth</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Solis</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Applying Ensembling Methods to BERT to Boost Model Performance</article-title>
          <source>Stanford University</source>
          <access-date>2021-11-18</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://web.stanford.edu/class/archive/cs/cs224n/cs224n.1194/reports/default/15775971.pdf">https://web.stanford.edu/class/archive/cs/cs224n/cs224n.1194/reports/default/15775971.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wolf</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Debut</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sanh</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chaumond</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Delangue</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Moi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cistac</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rault</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Louf</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Funtowicz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Davison</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shleifer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>von Platen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jernite</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Plu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Le Scao</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gugger</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Drame</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lhoest</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Rush</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Transformers: State-of-the-Art Natural Language Processing</article-title>
          <year>2020</year>
          <conf-name>Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing: System Demonstrations</conf-name>
          <conf-date>Oct 2020</conf-date>
          <conf-loc>Online</conf-loc>
          <fpage>38</fpage>
          <lpage>45</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://huggingface.co/transformers/"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/2020.emnlp-demos.6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="web">
          <source>HuggingFace</source>
          <access-date>2021-11-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://huggingface.co/">https://huggingface.co/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yoon</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>So</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>BioBERT: a pre-trained biomedical language representation model for biomedical text mining</article-title>
          <source>Bioinformatics</source>
          <year>2020</year>
          <month>02</month>
          <day>15</day>
          <volume>36</volume>
          <issue>4</issue>
          <fpage>1234</fpage>
          <lpage>1240</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31501885"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btz682</pub-id>
          <pub-id pub-id-type="medline">31501885</pub-id>
          <pub-id pub-id-type="pii">5566506</pub-id>
          <pub-id pub-id-type="pmcid">PMC7703786</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Transfer Learning in Biomedical Natural Language Processing: An Evaluation of BERT and ELMo on Ten Benchmarking Datasets</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online Jun 13, 2019
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1906.05474"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/w19-5006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tinn</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lucas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Usuyama</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Naumann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Poon</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Domain-Specific Language Model Pretraining for Biomedical Natural Language Processing</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online Jul 30, 2020
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/2007.15779"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3458754</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kiros</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zemel</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Salakhutdinov</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Urtasun</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Torralba</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fidler</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Aligning books and movies: Towards story-like visual explanations by watching movies and reading book</article-title>
          <year>2015</year>
          <conf-name>2015 IEEE International Conference on Computer Vision (ICCV)</conf-name>
          <conf-date>December 7-13, 2015</conf-date>
          <conf-loc>Santiago, Chile</conf-loc>
          <fpage>19</fpage>
          <lpage>27</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.computer.org/csdl/proceedings-article/iccv/2015/8391a019/12OmNro0HYa"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/ICCV.2015.11</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="web">
          <article-title>BLURB Leaderboard</article-title>
          <source>Microsoft</source>
          <year>2020</year>
          <access-date>2021-11-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://microsoft.github.io/BLURB/index.html#page-top">https://microsoft.github.io/BLURB/index.html#page-top</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bekkar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Djema</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Alitouche</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Evaluation measures for models assessment over imbalanced data sets</article-title>
          <source>J Info Eng Appl</source>
          <year>2013</year>
          <volume>3</volume>
          <issue>10</issue>
          <fpage>27</fpage>
          <lpage>38</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchgate.net/publication/292718336_Evaluation_measures_for_models_assessment_over_imbalanced_data_sets"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abdelkader</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Navarro</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Parrish</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Cotoi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Germini</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Iorio</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lokker</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Machine Learning Approaches to Retrieve High-Quality, Clinically Relevant Evidence From the Biomedical Literature: Systematic Review</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>09</month>
          <day>09</day>
          <volume>9</volume>
          <issue>9</issue>
          <fpage>e30401</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/9/e30401/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/30401</pub-id>
          <pub-id pub-id-type="medline">34499041</pub-id>
          <pub-id pub-id-type="pii">v9i9e30401</pub-id>
          <pub-id pub-id-type="pmcid">PMC8461527</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Watson</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Krutzinna</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bruce</surname>
              <given-names>IN</given-names>
            </name>
            <name name-style="western">
              <surname>Griffiths</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>McInnes</surname>
              <given-names>IB</given-names>
            </name>
            <name name-style="western">
              <surname>Barnes</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Floridi</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Clinical applications of machine learning algorithms: beyond the black box</article-title>
          <source>BMJ</source>
          <year>2019</year>
          <month>03</month>
          <day>12</day>
          <volume>364</volume>
          <fpage>l886</fpage>
          <pub-id pub-id-type="doi">10.1136/bmj.l886</pub-id>
          <pub-id pub-id-type="medline">30862612</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hoeren</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Niehoff</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Artificial Intelligence in Medical Diagnoses and the Right to Explanation</article-title>
          <source>European Data Protection Law Review</source>
          <year>2018</year>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>308</fpage>
          <lpage>319</lpage>
          <pub-id pub-id-type="doi">10.21552/edpl/2018/3/9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Du</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Techniques for Interpretable Machine Learning</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online Jul 31, 2018
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1808.00033"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3359786</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chakraborty</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tomsett</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Raghavendra</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Harborne</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Alzantot</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cerutti</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Srivastava</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Preece</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Julier</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kelley</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Braines</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sensoy</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Willis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gurram</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Interpretability of deep learning models: A survey of results</article-title>
          <year>2017</year>
          <conf-name>IEEE SmartWorld, Ubiquitous Intelligence &#38; Computing, Advanced &#38; Trusted Computed, Scalable Computing &#38; Communications, Cloud &#38; Big Data Computing, Internet of People and Smart City Innovation (SmartWorld/SCALCOM/UIC/ATC/CBDCom/IOP/SCI)</conf-name>
          <conf-date>Aug 4-7, 2017</conf-date>
          <conf-loc>San Francisco, CA</conf-loc>
          <pub-id pub-id-type="doi">10.1109/uic-atc.2017.8397411</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
