<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
    <front>
        <journal-meta>
            <journal-id journal-id-type="publisher-id">ResProt</journal-id>
            <journal-id journal-id-type="nlm-ta">JMIR Res Protoc</journal-id>
            <journal-title>JMIR Research Protocols</journal-title>
            <issn pub-type="epub">1929-0748</issn>
            <publisher>
                <publisher-name>JMIR Publications Inc.</publisher-name>
                <publisher-loc>Toronto, Canada</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="publisher-id">v5i2e40</article-id>
            <article-id pub-id-type="pmid">27066806</article-id>
            <article-id pub-id-type="doi">10.2196/resprot.5028</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Original Paper</subject>
                </subj-group>
                <subj-group subj-group-type="article-type">
                    <subject>Original Paper</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Using Nonexperts for Annotating Pharmacokinetic Drug-Drug Interaction Mentions in Product Labeling: A Feasibility Study</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="editor">
                    <name>
                        <surname>Eysenbach</surname>
                        <given-names>Gunther</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Doing-Harris</surname>
                        <given-names>Kristina</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Schulz</surname>
                        <given-names>Peter</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="author" id="contrib1" corresp="yes">
                    <name name-style="western">
                        <surname>Hochheiser</surname>
                        <given-names>Harry</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <address>
                        <institution>Department of Biomedical Informatics</institution>
                        <institution>School of Medicine</institution>
                        <institution>University of Pittsburgh</institution>
                        <addr-line>5607 Baum Blvd</addr-line>
                        <addr-line>Suite 523</addr-line>
                        <addr-line>Pittsburgh, PA, </addr-line>
                        <country>United States</country>
                        <phone>1 412 648 9300</phone>
                        <fax>1 412 624 5310</fax>
                        <email>harryh@pitt.edu</email>
                    </address>
                    <xref rid="aff2" ref-type="aff">2</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-8793-9982</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib2">
                    <name name-style="western">
                        <surname>Ning</surname>
                        <given-names>Yifan</given-names>
                    </name>
                    <degrees>MS</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-0883-4742</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib3">
                    <name name-style="western">
                        <surname>Hernandez</surname>
                        <given-names>Andres</given-names>
                    </name>
                    <degrees>MS</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <xref rid="aff3" ref-type="aff">3</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-6037-5451</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib4">
                    <name name-style="western">
                        <surname>Horn</surname>
                        <given-names>John R</given-names>
                    </name>
                    <degrees>PharmD</degrees>
                    <xref rid="aff4" ref-type="aff">4</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-4525-4250</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib5">
                    <name name-style="western">
                        <surname>Jacobson</surname>
                        <given-names>Rebecca</given-names>
                    </name>
                    <degrees>MS, MD</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <xref rid="aff2" ref-type="aff">2</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-5719-8340</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib6">
                    <name name-style="western">
                        <surname>Boyce</surname>
                        <given-names>Richard D</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-2993-2085</ext-link>
                </contrib>
            </contrib-group>
            <aff id="aff1">
                <sup>1</sup>
                <institution>Department of Biomedical Informatics</institution>
                <institution>School of Medicine</institution>
                <institution>University of Pittsburgh</institution>
                <addr-line>Pittsburgh, PA</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff2">
                <sup>2</sup>
                <institution>Intelligent Systems Program</institution>
                <institution>University of Pittsburgh</institution>
                <addr-line>Pittsburgh, PA</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff3">
                <sup>3</sup>
                <institution>Center for Bioinformatics and Computational Biology</institution>
                <institution>BIOS</institution>
                <addr-line>Manizales</addr-line>
                <country>Colombia</country>
            </aff>
            <aff id="aff4">
                <sup>4</sup>
                <institution>Department of Pharmacy</institution>
                <institution>School of Pharmacy and University of Washington Medicine, Pharmacy Services</institution>
                <institution>University of Washington</institution>
                <addr-line>Seattle, WA</addr-line>
                <country>United States</country>
            </aff>
            <author-notes>
                <corresp>Corresponding Author: Harry Hochheiser <email>harryh@pitt.edu</email>
                </corresp>
            </author-notes>
            <pub-date pub-type="collection">
                <season>Apr-Jun</season>
                <year>2016</year>
            </pub-date>
            <pub-date pub-type="epub">
                <day>11</day>
                <month>04</month>
                <year>2016</year>
            </pub-date>
            <volume>5</volume>
            <issue>2</issue>
            <elocation-id>e40</elocation-id>
            <!--history from ojs - api-xml-->
            <history>
                <date date-type="received">
                    <day>17</day>
                    <month>8</month>
                    <year>2015</year>
                </date>
                <date date-type="rev-request">
                    <day>12</day>
                    <month>11</month>
                    <year>2015</year>
                </date>
                <date date-type="rev-recd">
                    <day>25</day>
                    <month>11</month>
                    <year>2015</year>
                </date>
                <date date-type="accepted">
                    <day>19</day>
                    <month>12</month>
                    <year>2015</year>
                </date>
            </history>
            <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
            <copyright-statement>&#169;Harry Hochheiser, Yifan Ning, Andres Hernandez, John R Horn, Rebecca Jacobson, Richard D Boyce. Originally published in JMIR Research Protocols (http://www.researchprotocols.org), 11.04.2016. </copyright-statement>
            <copyright-year>2016</copyright-year>
            <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
                <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Research Protocols, is properly cited. The complete bibliographic information, a link to the original publication on http://www.researchprotocols.org, as well as this copyright and license information must be included.</p>
            </license>
            <self-uri xlink:href="http://www.researchprotocols.org/2016/2/e40/" xlink:type="simple" />
            <abstract>
                <sec sec-type="background">
                    <title>Background</title>
                    <p>Because vital details of potential pharmacokinetic drug-drug interactions are often described in free-text structured product labels, manual curation is a necessary but expensive step in the development of electronic drug-drug interaction information resources. The use of nonexperts to annotate potential drug-drug interaction (PDDI) mentions in drug product labels may be a means of lessening the burden of manual curation.</p>
                </sec>
                <sec sec-type="objective">
                    <title>Objective</title>
                    <p>Our goal was to explore the practicality of using nonexpert participants to annotate drug-drug interaction descriptions from structured product labels. By presenting annotation tasks to both pharmacy experts and relatively na&#239;ve participants, we hoped to demonstrate the feasibility of using nonexpert annotators for drug-drug information annotation. We were also interested in exploring whether and to what extent natural language processing (NLP) preannotation helped improve task completion time, accuracy, and subjective satisfaction.</p>
                </sec>
                <sec sec-type="methods">
                    <title>Methods</title>
                    <p>Two experts and 4 nonexperts were asked to annotate 208 structured product label sections under 4 conditions completed sequentially: (1) no NLP assistance, (2) preannotation of drug mentions, (3) preannotation of drug mentions and PDDIs, and (4) a repeat of the no-annotation condition. Results were evaluated within the 2 groups and relative to an existing gold standard. Participants were asked to provide reports on the time required to complete tasks and their perceptions of task difficulty.</p>
                </sec>
                <sec sec-type="results">
                    <title>Results</title>
                    <p>One of the experts and 3 of the nonexperts completed all tasks. Annotation results from the nonexpert group were relatively strong in every scenario and better than the performance of the NLP pipeline. The expert and 2 of the nonexperts were able to complete most tasks in less than 3 hours. Usability perceptions were generally positive (3.67 for expert, mean of 3.33 for nonexperts).</p>
                </sec>
                <sec sec-type="conclusions">
                    <title>Conclusions</title>
                    <p>The results suggest that nonexpert annotation might be a feasible option for comprehensive labeling of annotated PDDIs across a broader range of drug product labels. Preannotation of drug mentions may ease the annotation task. However, preannotation of PDDIs, as operationalized in this study, presented the participants with difficulties. Future work should test if these issues can be addressed by the use of better performing NLP and a different approach to presenting the PDDI preannotations to users during the annotation workflow.</p>
                </sec>
            </abstract>
            <kwd-group>
                <kwd>crowdsourcing</kwd>
                <kwd>natural language processing</kwd>
                <kwd>drug interactions</kwd>
                <kwd>drug product labeling</kwd>
                <kwd>structured product labels</kwd>
            </kwd-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="introduction">
            <title>Introduction</title>
            <p>Exposure to interacting drug combinations can lead to patient harm. Recent estimates indicate that between 5.3% and 14.3% of hospital patients in the United States experience a clinically meaningful alteration in the exposure or response of one drug occurring as a result of coadministration of another drug [<xref ref-type="bibr" rid="ref1">1</xref>]. Fortunately, such harm can often be avoided by employing appropriate management strategies [<xref ref-type="bibr" rid="ref2">2</xref>]. Toward that goal, US federal regulations require the mention of known, clinically relevant potential drug-drug interactions (PDDIs) in prescription drug labeling [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>].</p>
            <p>Structured product labels (SPLs) are mandated by the US Food and Drug Administration. The labels, produced by pharmaceutical manufacturers, are presented in a standardized format [<xref ref-type="bibr" rid="ref5">5</xref>] and approved by regulators. As detailed descriptions subject to regulatory approval, SPLs play a vital role in disseminating drug information. However, the structure in these documents is only in the form of high-level sections such as <italic>Description</italic>, <italic>Indications and Usage</italic>, <italic>Contraindications</italic>, and <italic>Warnings</italic>. Specific PDDI details are given in plain text, tables, and figures within the <italic>Drug Interactions</italic> section or other locations throughout the label. Although future efforts may lead to more structured and therefore more computable labels, the regulatory importance of the SPLs and the legacy labels of more than 16,000 drugs make the labels key resources for drug-drug interaction information.</p>
            <p>Unfortunately, product labeling is incomplete. A study of drugs that interact with the narrow therapeutic range drug warfarin found PDDI information deficiencies in 15% of relevant product labels [<xref ref-type="bibr" rid="ref6">6</xref>]. A broader study of drugs sold in the United States, United Kingdom, and Germany found that a warning about a critical drug interaction was missing from the label of one of the interacting drugs at least 40% of the time [<xref ref-type="bibr" rid="ref7">7</xref>]. Although publicly available PDDI information sources can serve as useful adjuncts to product label information, these collections are often far from complete. Our recent analysis of 14 collections of PDDI information found significant divergence, with overlap between pairs of sources usually less than 50% [<xref ref-type="bibr" rid="ref8">8</xref>]. Addressing the issue of missing product label PDDI information is important to better meet the information needs of drug experts, clinicians, and patients.</p>
            <p>We hypothesize that a computable representation of PDDIs present in product labels and other high-quality sources will enable novel methods for drug information retrieval that will in turn provide researchers and clinicians with improved capabilities for finding complete and current DDI information. Testing this hypothesis requires an efficient means of generating computable representations of PDDI mentions.</p>
            <p>In prior work, we developed a prototype system that used simple named entity recognition (NER) and Semantic Web Linked Data [<xref ref-type="bibr" rid="ref9">9</xref>] to link claims about PDDIs from publicly available external resources to the <italic>Drug Interactions</italic> section of the product label [<xref ref-type="bibr" rid="ref10">10</xref>]. Experiments found that our system linked at least one potentially novel interaction (ie, not mentioned in the label) to the <italic>Drug Interactions</italic> section of product labeling for 20 antidepressants. Moreover, there were several cases where all of the PDDI mentions linked to the <italic>Drug Interactions</italic> section for an antidepressant were potentially novel and would complement product label information. For example, an interaction between escitalopram and tapentadol mentioned in the National Drug File-Reference Terminology [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>] was potentially novel to all 20 escitalopram product labels.</p>
            <p>While promising, the simple NER approach often missed potentially important links between the label and other sources. Sophisticated natural language processing (NLP) methods might prove to be more complete, accurate, and scalable than simple NER. However, there is reason to believe that even the best NLP methods would not perform well enough to guarantee automatic identification of all PDDI mentions across all drug product labels. The PDDI NLP algorithm that performed best against the 2013 SemEval Challenge text corpus had a sentence-level recall of 0.81 and a precision of 0.86 (F<sub>1</sub>=0.84) [<xref ref-type="bibr" rid="ref13">13</xref>]. An algorithm we developed in prior work focusing specifically on NLP identification of pharmacokinetic PDDI mentions within product label sections had a document-level recall of 0.84 and a precision of 0.88 (F<sub>1</sub>=0.86) [<xref ref-type="bibr" rid="ref14">14</xref>] (sentence-level performance was not evaluated).</p>
            <p>Based on these findings, we have concluded that the involvement of human curators is necessary for the task of generating computable representations of PDDIs present in product labels and other high-quality sources. The use of semiautomatic curation is relatively common in biomedicine [<xref ref-type="bibr" rid="ref15">15</xref>]. Unfortunately, the high cost of expert annotation is a major potential barrier to further progress. New approaches are needed to increase the scale and quality of data curation.</p>
            <p>Replacing experts with nonexpert crowds (crowdsourcing) can increase the feasibility of large-scale annotation tasks for biomedical data [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref18">18</xref>]. Initial efforts at crowdsourcing for the annotation of medical text have found the method to be effective when the workflow is properly managed [<xref ref-type="bibr" rid="ref16">16</xref>]. Results can be comparable in quality to those obtained via more traditional and expensive expert annotation methods [<xref ref-type="bibr" rid="ref17">17</xref>]. Crowdsourcing is particularly attractive for obtaining results faster and at a lower cost than other participant recruitment schemes [<xref ref-type="bibr" rid="ref17">17</xref>]. The Informatics for Integrating Biology and the Bedside (i2b2) 2010 workshop assessment found that a well-selected group of nonexperts could perform extraction of drug information from clinical reports [<xref ref-type="bibr" rid="ref19">19</xref>]. Other biomedical efforts have applied crowdsourcing to gene-mutation mentions in the biomedical literature [<xref ref-type="bibr" rid="ref20">20</xref>] and for clinical trial announcements [<xref ref-type="bibr" rid="ref21">21</xref>]. A study of the feasibility of using people recruited through Amazon&#8217;s Mechanical Turk to annotate medication indications found that nonexperts could achieve accuracy of greater than 95% on the binary question of whether a medication is an indication for a disease mentioned in the medication&#8217;s drug label [<xref ref-type="bibr" rid="ref22">22</xref>]. Similar approaches have been used to engage communities of experts in tackling challenges such as linking medications and problems in clinical texts from electronic medical records [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>] and developing mappings between institutional procedure descriptions and Logical Observation Identifiers Names and Codes (LOINC) [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>].</p>
            <p>Our experience with NLP methods for extracting PDDI annotations suggests the possibility of using NLP annotation to provide suggestions to human annotators. Previous efforts have explored the possibility of using such preannotation. Hanauer et al [<xref ref-type="bibr" rid="ref27">27</xref>] found that iterative alternation between human annotation and model building facilitated rapid creation of NLP models. Some comparative studies have shown that preannotation can improve annotator performance relative to unassisted annotation [<xref ref-type="bibr" rid="ref28">28</xref>-<xref ref-type="bibr" rid="ref30">30</xref>], but other studies have seen no difference [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
            <p>The goal of this study was to assess the potential feasibility of using persons who are not drug experts in the task of annotating PDDIs mentioned in drug product labels. A secondary goal was to test the influence of NLP assistance on the annotation quality of both experts and nonexperts.</p>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <sec>
                <title>The Annotation Model</title>
                <p>PDDI annotation requires a data model that describes the types of information that must be collected. The PDDI data model used in this study is given in <xref ref-type="fig" rid="figure1">Figure 1</xref>. Each PDDI mention is extracted from a span of sentences present within a product label and can include four features:</p>
                <list list-type="bullet">
                    <list-item>
                        <p>Type of evidence (active ingredient, metabolite, or drug product): an active ingredient is a pharmacologically active chemical component used in a drug product. A metabolite is a biochemical entity produced as a result of drug metabolism. A drug product is a packaging of an active ingredient for sale or distribution, often identified by a brand name. Throughout this paper, we use the generic term &#8220;drug&#8221; to mean any of these three types.</p>
                    </list-item>
                    <list-item>
                        <p>Role (object or precipitant): the role that each drug plays within the interaction. In pharmacokinetic PDDIs the precipitant drug affects an enzyme that regulates the absorption, distribution, metabolism, or excretion of the object drug.</p>
                    </list-item>
                    <list-item>
                        <p>Statement (quantitative or qualitative): an indication of whether the PDDI mention describes the pharmacokinetic effect of a DDI in quantitative terms (50% increase) or qualitative terms (increase or decrease) with no indication of magnitude.</p>
                    </list-item>
                    <list-item>
                        <p>Modality (positive or negative): whether the PDDI mention is making a positive or negative claim. A positive claim is one that supports the existence of the interaction. A negative claim is one that explicitly states that no interaction exists between the drugs in question.</p>
                    </list-item>
                </list>
                <fig id="figure1" position="float">
                    <label>Figure 1</label>
                    <caption>
                        <p>Data model used in this study for PDDIs mentioned within drug product labels.</p>
                    </caption>
                    <graphic xlink:href="resprot_v5i2e40_fig1.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Natural Language Processing Pipeline and Postprocessing Module</title>
                <p>In prior work, we developed algorithms for extracting drug named entities and pharmacokinetic PDDI mentions from drug product labels [<xref ref-type="bibr" rid="ref14">14</xref>]. We integrated our NLP algorithms into a preannotation pipeline (<xref ref-type="fig" rid="figure2">Figure 2</xref>). The pipeline used the following steps:</p>
                <list list-type="order">
                    <list-item>
                        <p>The NLP process applies NER to each product label section [<xref ref-type="bibr" rid="ref32">32</xref>]. The NER algorithm uses the National Center for Biomedical Ontology BioPortal Annotator to extract drug mentions and synonyms from the RxNorm and MeSH terminologies [<xref ref-type="bibr" rid="ref33">33</xref>]. The results are postprocessed to improve recall and precision by filtering out entities that are not active ingredients, drug products, or metabolites based on entity relationships provided by RxNorm and WordNet [<xref ref-type="bibr" rid="ref34">34</xref>].</p>
                    </list-item>
                    <list-item>
                        <p>Output from the NER process is then processed by an NLP algorithm for identifying pharmacokinetic PDDI mentions [<xref ref-type="bibr" rid="ref14">14</xref>]. For each product label section, the PDDI extraction algorithm outputs a table of sentence spans labeled as to whether they include a pharmacokinetic PDDI (true or false). Spans including PDDI mentions are also labeled to indicate the modality of the mention (positive or negative). Output of the NLP algorithm is passed to a postprocessing module designed to increase the process's precision and recall (<xref ref-type="fig" rid="figure2">Figure 2</xref>). This module uses RxNorm relationships and exact case-insensitive matching to map drug product mentions to unique identifiers of the sole active ingredients.</p>
                    </list-item>
                    <list-item>
                        <p>The PDDI mentions present in the corpus are transformed into a machine-readable annotation schema using the Open Annotation data model [<xref ref-type="bibr" rid="ref35">35</xref>], necessary for subsequent loading into the study annotation tool.</p>
                    </list-item>
                    <list-item>
                        <p>Finally, the resulting preannotated named entities and PDDI mentions are loaded into the study annotation tool.</p>
                    </list-item>
                </list>
                <fig id="figure2" position="float">
                    <label>Figure 2</label>
                    <caption>
                        <p>Pipeline for extraction of pharmacokinetic PDDIs from drug label sections.</p>
                    </caption>
                    <graphic xlink:href="resprot_v5i2e40_fig2.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Reference Standard</title>
                <p>In an earlier study, we developed a corpus of 208 annotated PDDI statements from SPLs. Two experts in drug information used the data model described above to annotate these sections, with subsequent discussions used to develop a consensus model. The resulting corpus contains 607 pharmacokinetic PDDI mentions along with 3351 active ingredients, 234 drug products, and 201 metabolite mentions [<xref ref-type="bibr" rid="ref14">14</xref>]. These sections were used in the current study, with the consensus annotations acting as a gold standard.</p>
            </sec>
            <sec>
                <title>Drug-Drug Interaction Annotation Tool</title>
                <p>Participants used a custom-designed user interface (<xref ref-type="fig" rid="figure3">Figure 3</xref>) based on the DOMEO Web-based system [<xref ref-type="bibr" rid="ref36">36</xref>] to annotate PDDI mentions. DOMEO is an extensible Web application that supports scalable Web-based annotation necessary for crowdsourcing efforts [<xref ref-type="bibr" rid="ref37">37</xref>]. We extended DOMEO with a plugin that can be used to link text in drug label sections with details of the PDDI data model (<xref ref-type="fig" rid="figure1">Figure 1</xref>) [<xref ref-type="bibr" rid="ref38">38</xref>]. To complete a PDDI annotation task, users would view a product label section and select one or more sentences from the section that discusses the PDDI. They would then use our PDDI annotation plugin to provide values in a Web form indicating the two drugs involved in the interaction, the type and role for each drug, the type of PDDI mention (quantitative or qualitative), and the modality of the mention (positive or negative).</p>
                <fig id="figure3" position="float">
                    <label>Figure 3</label>
                    <caption>
                        <p>Screenshots of the DOMEO PDDI annotation plugin: (a) product label excerpt with text selected by an annotator as being relevant to a PDDI and (b) form with the fields that the annotator must complete in order to describe the PDDI using the data model described in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p>
                    </caption>
                    <graphic xlink:href="resprot_v5i2e40_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Annotation Scenarios</title>
                <p>We explored four annotation scenarios aimed at assessing the impact of different approaches to NLP preannotation. The 208 product label sections from our reference standard [<xref ref-type="bibr" rid="ref14">14</xref>] were distributed across four scenarios so that each scenario had roughly the same number of long and short sections:</p>
                <list list-type="bullet">
                    <list-item>
                        <p>Scenario 1 (no assistance) consisted of 52 label sections with no NLP assistance for annotation. Annotators had to read and highlight all drugs and PDDI mentions within the assigned drug label sections.</p>
                    </list-item>
                    <list-item>
                        <p>Scenario 2 (drug mentions) consisted of 52 drug label sections with preannotations for drug mentions but not PDDI mentions. Annotators had to correct preannotated drug mentions, identify any drug mentions that the NLP missed, and highlight all PDDIs mentioned in the label sentences.</p>
                    </list-item>
                    <list-item>
                        <p>Scenario 3 (drug mention plus PDDIs) consisted of 53 label sections preannotated with both drug and PDDI mentions. The annotator had to edit and correct NLP preannotations and add any mentions missed by the NLP.</p>
                    </list-item>
                    <list-item>
                        <p>Scenario 4 (no assistance, second time), a second completely unassisted scenario, was included with the intent of measuring any learning effects associated with the completion of the NLP-assisted tasks. This scenario consisted of 48 drug label sections.</p>
                    </list-item>
                </list>
                <p>Each participant completed all four scenarios in order. Three of the 208 sections were reserved for training purposes to familiarize participants with the annotation tool and process, leaving 205 sections to be annotated by each participant.</p>
            </sec>
            <sec>
                <title>Participants</title>
                <p>A drug expert was defined as a professional in pharmacy or a related field with a Doctor of Pharmacy degree or equivalent and more than five years&#8217; experience in drug-drug interaction research. A drug nonexpert was defined as an undergraduate or graduate student with some basic training in chemistry. Both expert and nonexpert participants were recruited from personal contacts of the investigative team. All participants were compensated for participating in this study. The University of Pittsburgh Institutional Review Board approved the study protocol as exempt.</p>
            </sec>
            <sec>
                <title>Annotator Guidelines and Training</title>
                <p>Annotators were provided with guidelines describing the annotation task. Guidelines were written based on the assumption of college-level formal training in chemistry (eg, general chemistry) for both groups. The complete guidelines are provided in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>. Participants attended a half-day training session that introduced the goal of the annotation task and provided the annotation guidelines.</p>
            </sec>
            <sec>
                <title>Annotation Tasks</title>
                <p>Each participant completed all of the four scenarios in the order given above. For each task, the annotators were asked to read the entire content of the relevant drug label sections, identify all drug and PDDI mentions, and record information about the PDDI corresponding to the PDDI annotation model. They were also asked to self-report the amount of time it took to completely annotate each section. The results of each training task were verified to ensure that each annotator completed each scenario according to the study requirements. A short questionnaire completed at the end of each scenario included closed- and open-ended questions about the participant's perception of the usability and effectiveness of the annotation tool and NLP preannotation.</p>
            </sec>
            <sec>
                <title>Annotation Performance Metrics</title>
                <p>Performance metrics were calculated by comparing the PDDIs in each participant's results with the reference standard described above [<xref ref-type="bibr" rid="ref14">14</xref>]. A user&#8217;s annotations were considered true positives if they (a) matched the precipitant, object, and modality of the reference standard and (b) used sentences that either partially or exactly overlapped the sentences used in the reference standard. Metrics were computed by label and then averaged by scenario.</p>
                <p>We supplemented the standard metrics of precision, recall, and F<sub>1</sub> with additional metrics to gain more insight into the effect of NLP preannotation on the PDDI annotation task. Specifically, for Scenario 3 (ie, the full NER plus NLP preannotation), we evaluated how often participants decided to change NLP annotations and whether those NLP annotations agreed or disagreed with the reference standard.</p>
            </sec>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <p>Two experts and 4 nonexperts were recruited into the study. One expert left the study after experiencing too many difficulties with the PDDI annotation user interface. One nonexpert left the study because of not having time to complete annotations due to work and school commitments. The remaining participants completed the annotation task for all scenarios.</p>
            <p>Annotation performances measured in F<sub>1</sub> score relative to the reference standard [<xref ref-type="bibr" rid="ref14">14</xref>] indicate relatively strong performance (F<sub>1</sub>&#62;0.7) for all participants for the first two scenarios, with a drop in performance for the last two scenarios (<xref ref-type="fig" rid="figure4">Figure 4</xref> and <xref ref-type="table" rid="table1">Table 1</xref>; full recall and precision results in <xref ref-type="app" rid="app2">Multimedia Appendix 2</xref>). The performance of the entire NLP pipeline is included for each scenario for comparison even though participants were only provided PDDI preannotations in Scenario 3.</p>
            <p>
                <xref ref-type="table" rid="table2">Tables 2</xref> and <xref ref-type="table" rid="table3">3</xref> summarize self-reported task completion times and subjective feedback across the first three scenarios. As Scenario 4 was conducted solely to assess learning effects, task completion time and subjective responses were not collected. Participants differed in their reports of time required, ranging from Nonexpert 1 reporting times comparable to those of the expert to Nonexpert 3 reporting more than 5 hours spent completing Scenario 3 (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
            <p>Results from the subjective question assessing ease of use are given in <xref ref-type="table" rid="table3">Table 3</xref>. Users agreed that the PDDI annotation interface was moderately difficult when full preannotation assistance was enabled and also agreed that the PDDI annotation plugin without NLP assistance or using a lower level of assistance is relatively easy to use. Full questionnaires and results are given in <xref ref-type="app" rid="app3">Multimedia Appendices 3-7</xref>.</p>
            <p>
                <xref ref-type="table" rid="table4">Tables 4</xref> and <xref ref-type="table" rid="table5">5</xref> illustrate the agreement between the participants, NLP, and reference standard in the scenario with NLP and preannotation assistance (Scenario 3). <xref ref-type="table" rid="table4">Table 4</xref> addresses performance on the 151 PDDI annotations found in the reference standard, while <xref ref-type="table" rid="table5">Table 5</xref> summarizes false positives&#8212;mentions extracted in the NLP or by users that were not found in the reference standard.</p>
            <p>Though exploratory because of the very small sample size, success in detecting true-positive PDDI mentions missed by the NLP was similar between the expert and nonexperts (<xref ref-type="table" rid="table4">Table 4</xref>, column 2). The expert also had slightly more false negatives than the nonexpert participants irrespective of whether spans were found by NLP (<xref ref-type="table" rid="table4">Table 4</xref>, columns 1 and 3). False-positive rates for the expert were comparable to those of the nonexperts (<xref ref-type="table" rid="table5">Table 5</xref>, column 1). Nonexperts also seemed to be slightly more likely to agree with false-positive mentions extracted by the NLP (<xref ref-type="table" rid="table5">Table 5</xref>, columns 2 and 3).</p>
            <table-wrap position="float" id="table1">
                <label>Table 1</label>
                <caption>
                    <p>F<sub>1</sub> measures for all participants and NLP system across all scenarios and overall.</p>
                </caption>
                <table width="516" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                    <col width="88" />
                    <col width="70" />
                    <col width="70" />
                    <col width="64" />
                    <col width="64" />
                    <col width="76" />
                    <thead>
                        <tr valign="bottom">
                            <td>Annotator</td>
                            <td>Scenario<break />1<sup>a</sup>
                            </td>
                            <td>Scenario<break />2<sup>b</sup>
                            </td>
                            <td>Scenario<break />3<sup>c</sup>
                            </td>
                            <td>Scenario<break />4<sup>d</sup>
                            </td>
                            <td>Overall</td>
                        </tr>
                    </thead>
                    <tbody>
                        <tr valign="top">
                            <td>Expert</td>
                            <td>0.80</td>
                            <td>0.79</td>
                            <td>0.54</td>
                            <td>0.66</td>
                            <td>0.68</td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 1</td>
                            <td>0.79</td>
                            <td>0.83</td>
                            <td>0.59</td>
                            <td>0.53</td>
                            <td>0.66</td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 2</td>
                            <td>0.76</td>
                            <td>0.68</td>
                            <td>0.57</td>
                            <td>0.70</td>
                            <td>0.67</td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 3</td>
                            <td>0.74</td>
                            <td>0.62</td>
                            <td>0.53</td>
                            <td>0.62</td>
                            <td>0.61</td>
                        </tr>
                        <tr valign="top">
                            <td>NLP</td>
                            <td>0.58</td>
                            <td>0.40</td>
                            <td>0.41</td>
                            <td>0.46</td>
                            <td>0.46</td>
                        </tr>
                    </tbody>
                </table>
                <table-wrap-foot>
                    <fn id="table1fn1">
                        <p>
                            <sup>a</sup>No assistance.</p>
                    </fn>
                    <fn id="table1fn2">
                        <p>
                            <sup>b</sup>Preannotation of drug mentions.</p>
                    </fn>
                    <fn id="table1fn3">
                        <p>
                            <sup>c</sup>Preannotation of drug mentions and PDDIs.</p>
                    </fn>
                    <fn id="table1fn4">
                        <p>
                            <sup>d</sup>No assistance (second time).</p>
                    </fn>
                </table-wrap-foot>
            </table-wrap>
            <table-wrap position="float" id="table2">
                <label>Table 2</label>
                <caption>
                    <p>Participant self-reported task completion times.</p>
                </caption>
                <table width="590" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                    <col width="94" />
                    <col width="74" />
                    <col width="84" />
                    <col width="84" />
                    <col width="84" />
                    <col width="84" />
                    <thead>
                        <tr valign="top">
                            <td>Participant</td>
                            <td>Scenario</td>
                            <td>&#60;1 hour</td>
                            <td>1-3 hours</td>
                            <td>3-5 hours</td>
                            <td>&#62;5 hours</td>
                        </tr>
                    </thead>
                    <tbody>
                        <tr valign="top">
                            <td>Expert</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>1</td>
                            <td>X</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>2</td>
                            <td>X</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>3</td>
                            <td>X</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 1</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>1</td>
                            <td>X</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>2</td>
                            <td>X</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>3</td>
                            <td>X</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 2</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>1</td>
                            <td>
                                <break />
                            </td>
                            <td>X</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>2</td>
                            <td>X</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>3</td>
                            <td>X</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 3</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>1</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>X</td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>2</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>X</td>
                            <td>
                                <break />
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>3</td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>
                                <break />
                            </td>
                            <td>X</td>
                        </tr>
                    </tbody>
                </table>
            </table-wrap>
            <table-wrap position="float" id="table3">
                <label>Table 3</label>
                <caption>
                    <p>Usability questionnaire results. All results reported on a 5-point scale (1=<italic>very difficult</italic> to 5=<italic>very easy</italic>).</p>
                </caption>
                <table width="590" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                    <col width="103" />
                    <col width="104" />
                    <col width="104" />
                    <col width="104" />
                    <col width="104" />
                    <thead>
                        <tr valign="top">
                            <td>Participant</td>
                            <td>Scenario 1</td>
                            <td>Scenario 2</td>
                            <td>Scenario 3</td>
                            <td>Mean</td>
                        </tr>
                    </thead>
                    <tbody>
                        <tr valign="top">
                            <td>Expert</td>
                            <td>2</td>
                            <td>4</td>
                            <td>2</td>
                            <td>2.67</td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 1</td>
                            <td>4</td>
                            <td>5</td>
                            <td>2</td>
                            <td>3.67</td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 2</td>
                            <td>4</td>
                            <td>5</td>
                            <td>2</td>
                            <td>3.67</td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 3</td>
                            <td>3</td>
                            <td>3</td>
                            <td>2</td>
                            <td>2.67</td>
                        </tr>
                        <tr valign="top">
                            <td>Mean</td>
                            <td>3.25</td>
                            <td>4.25</td>
                            <td>2</td>
                            <td>&#8212;</td>
                        </tr>
                    </tbody>
                </table>
            </table-wrap>
            <table-wrap position="float" id="table4">
                <label>Table 4</label>
                <caption>
                    <p>Comparison of agreement between the participants, NLP preannotation, and PDDI annotations (N=151) in the reference standard during the scenario with NER and NLP preannotation assistance (Scenario 3).</p>
                </caption>
                <table width="522" border="0" cellpadding="8" cellspacing="0" rules="groups" frame="hsides">
                    <col width="86" />
                    <col width="80" />
                    <col width="98" />
                    <col width="86" />
                    <col width="92" />
                    <thead>
                        <tr valign="top">
                            <td>NLP Result</td>
                            <td colspan="2">No mention found</td>
                            <td colspan="2">Mention</td>
                        </tr>
                        <tr valign="bottom">
                            <td>Participant</td>
                            <td>No mention</td>
                            <td>Mention<sup>a</sup>
                            </td>
                            <td>No mention<sup>b</sup>
                            </td>
                            <td>Mention</td>
                        </tr>
                        <tr valign="bottom">
                            <td>
                                <break />
                            </td>
                            <td>NLP FN<sup>c</sup>
                                <break />User FN<break />n (%)</td>
                            <td>NLP FN<break />User TP<break />n (%)</td>
                            <td>NLP TP<sup>d</sup>
                                <break />User FN<break />n (%)</td>
                            <td>NLP TP<break />User TP<break />n (%)</td>
                        </tr>
                    </thead>
                    <tbody>
                        <tr valign="top">
                            <td>Expert</td>
                            <td>59 (39.1)</td>
                            <td>50 (33.1)</td>
                            <td>23 (15.2)</td>
                            <td>19 (12.6)</td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 1</td>
                            <td>46 (30.5)</td>
                            <td>63 (41.7)</td>
                            <td>11 (7.3)</td>
                            <td>31 (20.5)</td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 2</td>
                            <td>43 (28.5)</td>
                            <td>66 (43.7)</td>
                            <td>11 (7.3)</td>
                            <td>31 (20.5)</td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 3</td>
                            <td>49 (32.5)</td>
                            <td>60 (39.7)</td>
                            <td>13 (8.6)</td>
                            <td>29 (19.2)</td>
                        </tr>
                    </tbody>
                </table>
                <table-wrap-foot>
                    <fn id="table4fn1">
                        <p>
                            <sup>a</sup>Indicates cases where the user corrected an NLP error.</p>
                    </fn>
                    <fn id="table4fn2">
                        <p>
                            <sup>b</sup>Indicates cases where the NLP was correct and the user was incorrect.</p>
                    </fn>
                    <fn id="table4fn3">
                        <p>
                            <sup>c</sup>FN: false negative</p>
                    </fn>
                    <fn id="table4fn4">
                        <p>
                            <sup>d</sup>TP: true positive</p>
                    </fn>
                </table-wrap-foot>
            </table-wrap>
            <table-wrap position="float" id="table5">
                <label>Table 5</label>
                <caption>
                    <p>Analysis of user and NLP false positives relative to the reference standard for Scenario 3.</p>
                </caption>
                <table width="414" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                    <col width="87" />
                    <col width="88" />
                    <col width="100" />
                    <col width="81" />
                    <thead>
                        <tr valign="top">
                            <td>NLP result</td>
                            <td>No mention</td>
                            <td colspan="2">Mention (n=93)</td>
                        </tr>
                        <tr valign="bottom">
                            <td>Participant</td>
                            <td>Mention<sup>a</sup>
                            </td>
                            <td>No mention<sup>b</sup>
                            </td>
                            <td>Mention</td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>NLP TN<break />User FP<break />n</td>
                            <td>NLP FP<break />User TN<break />n (%)</td>
                            <td>NLP FP<break />User FP<break />n (%)</td>
                        </tr>
                    </thead>
                    <tbody>
                        <tr valign="top">
                            <td>Expert</td>
                            <td>25</td>
                            <td>93 (100)</td>
                            <td>0 (0)</td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 1</td>
                            <td>16</td>
                            <td>88 (94.6)</td>
                            <td>5 (5.4)</td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 2</td>
                            <td>37</td>
                            <td>86 (92.5)</td>
                            <td>7 (7.5)</td>
                        </tr>
                        <tr valign="top">
                            <td>Nonexpert 3</td>
                            <td>24</td>
                            <td>88 (94.6)</td>
                            <td>5 (5.4)</td>
                        </tr>
                    </tbody>
                </table>
                <table-wrap-foot>
                    <fn id="table5fn1">
                        <p>
                            <sup>a</sup>Indicates cases where the user identified spans that were not identified by the NLP.</p>
                    </fn>
                    <fn id="table5fn2">
                        <p>
                            <sup>b</sup>Indicates cases where the NLP identified spans that the participant did not annotate.</p>
                    </fn>
                </table-wrap-foot>
            </table-wrap>
            <fig id="figure4" position="float">
                <label>Figure 4</label>
                <caption>
                    <p>Annotator and NLP performance (F1 scores) for each of the four scenarios and overall performance across all four scenarios.</p>
                </caption>
                <graphic xlink:href="resprot_v5i2e40_fig4.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
            </fig>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <sec>
                <title>Overview</title>
                <p>Our long-term goal is to develop tools that will deliver computable representations of reliable, accurate PDDI information to clinicians, facilitating decision support and hopefully reducing adverse events. The number of drugs that might need to be addressed (more than 16,000) and the complexity of the content in the SPLs make this a daunting task. Our experience in building NLP tools for the extraction of PDDI information [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref14">14</xref>] illustrated some of the difficulty and led us to the conclusion that some amount of manual involvement in the process was required.</p>
                <p>Our goal in this study was to address two key questions in the development of human-assisted processes for curating PDDI information. Specifically, who should conduct the annotation and what sort of assistance should they receive? Although pharmacists and other domain experts familiar with drug information presumably have the background and training necessary to interpret SPLs, annotation by experts is often prohibitively difficult. Thus, we set out to gain some preliminary insight into the practicality of asking participants not specifically trained in drug information to annotate this data. Second, we were interested in understanding what level of assistance might be helpful for users. If our NLP tools were found to speed completion of annotation tasks without reducing accuracy, this would decrease the cost of PDDI annotation even for nonexperts.</p>
            </sec>
            <sec>
                <title>Is It Possible for Nonexperts to Produce Reliable PDDI Annotations From Drug Labels?</title>
                <p>Annotation results from the nonexpert group were relatively strong in every scenario and better than the performance of the NLP pipeline (<xref ref-type="fig" rid="figure4">Figure 4</xref>). These findings suggest that nonexperts might be able to produce reliable PDDI annotations from drug labels with accuracy levels similar to those of experts and that crowdsourcing might be a feasible option for annotating PDDIs across a broader range of drug product labels. Our results are consistent with earlier demonstrations of the feasibility of applying crowdsourcing to related problems in annotation of biomedical texts [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref22">22</xref>].</p>
                <p>Ensuring the success of nonexpert annotations of PDDI mentions will likely require greater attention to two key issues: the usability of the annotation tools and the selection of the annotators.</p>
                <p>Although self-reported task completion times (<xref ref-type="table" rid="table2">Table 2</xref>) indicated that two of the nonexperts were able to complete all tasks in times comparable to those of the expert, one nonexpert (Nonexpert 3) needed substantially more time. Differences in F<sub>1</sub> scores (<xref ref-type="table" rid="table1">Table 1</xref>) suggest that annotations provided by Nonexpert 3 were of slightly lower quality than those of the other two nonexperts. The combination of increased task-completion time and lower F<sub>1</sub> scores suggests that Nonexpert 3 may have struggled more than the other participants with the annotation task. In addition, difficulties with the annotation interface prevented one expert user from completing the annotation tasks.</p>
                <p>Despite these difficulties, responses to the usability questions (<xref ref-type="table" rid="table3">Table 3</xref>) were generally positive, suggesting that usability concerns should not be insurmountable. The small sample size and self-reported time results limit our ability to develop a nuanced understanding of specific issues that might have led to increased task completion times or dissatisfaction with the user interface. Observational user studies, including think-aloud feedback from participants, would likely provide insight into usability problems, potential opportunities for redesign [<xref ref-type="bibr" rid="ref39">39</xref>], and any difficulties associated with the longer task completion times and lower performance of Nonexpert 3.</p>
                <p>Results from the repeated no assistance scenario (Scenario 4) do not appear to show any learning effect based on the previous three scenarios. Exposure to the preannotations in scenarios 2 and 3 may have confused participants, pointing out complexities in interpretation of the labels that might have negatively impacted performance.</p>
                <p>Identification of individuals who are likely to produce high-quality results will be a key challenge for successful nonexpert annotation results. Although our nonexpert participants all had relevant educational backgrounds and computer experience, variations in the task completion times and F<sub>1</sub> scores suggest that some participants might find PDDI annotations more approachable than others. Future nonexpert PDDI annotation recruitment might draw on experience from prior efforts in crowdsourcing which have found that appropriate screening and training of participants can help improve outcomes [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>].</p>
            </sec>
            <sec>
                <title>What Is the Influence of NLP Assistance on Annotation Quality?</title>
                <p>Most participants perceived PDDI annotation to be easier when NER preannotation was provided. However, the full NLP assistance (Scenario 3: drug mention plus PDDI preannotations) was associated with lower levels of perceived usability for both expert and nonexpert participants (<xref ref-type="table" rid="table2">Table 2</xref>). Complaints about deleting false positives were commonly expressed in the questionnaire data. These results suggest that the performance of the NLP algorithm and the presentation of NLP preannotated PDDIs might have adversely impacted participant performance. Participants suggested several possible improvements, including preannotating with NER and then presenting NLP preannotations only after a section is annotated. The purpose then would be to highlight possibly missed interactions. We think this approach would depend on an NLP algorithm with much better sentence-level performance than the algorithm used in this study.</p>
                <p>Although exploratory, the comparison of the agreement between users, NLP preannotations, and the reference standard (<xref ref-type="table" rid="table4">Tables 4</xref> and <xref ref-type="table" rid="table5">5</xref>) suggests several questions for future study. The expert was slightly less likely than the nonexperts to correct NLP false negatives (<xref ref-type="table" rid="table4">Table 4</xref>, column 1), possibly because the expert might have inappropriately used knowledge of the domain or applied an overly strict interpretation of the PDDI identification guidelines. The expert user was also more likely to reject a correct NLP interpretation (<xref ref-type="table" rid="table4">Table 4</xref>, column 3) and more likely to reject an incorrect NLP assertion (<xref ref-type="table" rid="table5">Table 5</xref>, column 2), suggesting that the expert user&#8217;s thought processes were somehow different than those of the nonexperts. It is also possible that the nonexpert agreement with NLP false positives might be associated with greater trust in NLP on the part of the nonexpert participants. Of course, given the small size of this study, it is entirely possible that these participant-level observations are not statistically significant. Subsequent studies involving more participants and including investigation of user thought processes&#8212;perhaps via think-aloud protocols or retrospective interviews&#8212;would be needed to understand these phenomena.</p>
            </sec>
            <sec>
                <title>Limitations</title>
                <p>The generalizability of this study is limited by the small sample size; a larger study would be needed to more accurately characterize the differences between nonexperts, experts, and the NLP annotation. Another potential limitation of our study is that we could not evaluate the characteristics of label sections that might be more difficult to read and annotate by nonexperts. The experimental design attempted to address this concern by balancing the number of sections across each scenario to minimize the effect of differences in difficulty level. The study results might have been influenced by the accuracy of the NLP algorithm and the reliability and usability of the annotation user interface. Interface revisions based on usability might lead to improved performance for experts and nonexperts. Finally, as we did not conduct any debriefing interviews or otherwise assess participant mental states, we are only able to speculate as to factors that might contribute to differences in task performance.</p>
            </sec>
            <sec>
                <title>Conclusions</title>
                <p>Our goal was to explore the use of nonexperts to annotate PDDI mentions in drug product labels. Our results suggest that nonexperts could produce reliable PDDI annotations from drug labels with efficiency comparable to that of an expert annotator with training in pharmacy or pharmaceutics, indicating that the task of extracting PDDIs from drug product labeling might be suitable for crowdsourcing. Although NER preannotation was found useful to both experts and nonexperts, NLP preannotation as implemented in this study seemed to present an obstacle to all participants. A high performance NLP algorithm might still be helpful if NLP preannotations are shown to annotators after a section is annotated, if only to highlight possibly missed interactions. Improvements in the usability of the annotation tool and screening of potential annotators might further increase performance.</p>
            </sec>
        </sec>
    </body>
    <back>
        <app-group>
            <app id="app1">
                <title>Multimedia Appendix 1</title>
                <p>Annotation guidelines provided to study participants.</p>
                <media xlink:href="resprot_v5i2e40_app1.pdf" xlink:title="PDF File (Adobe PDF File), 2MB" />
            </app>
            <app id="app2">
                <title>Multimedia Appendix 2</title>
                <p>Full precision, recall and F1 results for all participants and for the NLP pipeline in each of the four scenarios.</p>
                <media xlink:href="resprot_v5i2e40_app2.pdf" xlink:title="PDF File (Adobe PDF File), 64KB" />
            </app>
            <app id="app3">
                <title>Multimedia Appendix 3</title>
                <p>Subjective questionnaires.</p>
                <media xlink:href="resprot_v5i2e40_app3.pdf" xlink:title="PDF File (Adobe PDF File), 44KB" />
            </app>
            <app id="app4">
                <title>Multimedia Appendix 4</title>
                <p>Subjective responses, Scenario 1.</p>
                <media xlink:href="resprot_v5i2e40_app4.xlsx" xlink:title="XLSX File (Microsoft Excel File), 26KB" />
            </app>
            <app id="app5">
                <title>Multimedia Appendix 5</title>
                <p>Subjective responses, Scenario 2.</p>
                <media xlink:href="resprot_v5i2e40_app5.xlsx" xlink:title="XLSX File (Microsoft Excel File), 29KB" />
            </app>
            <app id="app6">
                <title>Multimedia Appendix 6</title>
                <p>Subjective responses, Scenario 3.</p>
                <media xlink:href="resprot_v5i2e40_app6.xlsx" xlink:title="XLSX File (Microsoft Excel File), 35KB" />
            </app>
            <app id="app7">
                <title>Multimedia Appendix 7</title>
                <p>Subjective responses, Scenario 4.</p>
                <media xlink:href="resprot_v5i2e40_app7.xlsx" xlink:title="XLSX File (Microsoft Excel File), 25KB" />
            </app>
        </app-group>
        <glossary>
            <title>Abbreviations</title>
            <def-list>
                <def-item>
                    <term id="abb1">NER</term>
                    <def>
                        <p>named entity recognizer</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb2">NLP</term>
                    <def>
                        <p>natural language processing</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb3">SPL</term>
                    <def>
                        <p>structured product label</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb4">PDDI</term>
                    <def>
                        <p>potential drug-drug interaction</p>
                    </def>
                </def-item>
            </def-list>
        </glossary>
        <ack>
            <p>Research reported in this paper was partially supported by the Fogarty International Center of Global Health of the National Institutes of Health under grant number 1D43TW008443-01, National Institute on Aging grant K01AG044433, and National Library of Medicine grant 1R01LM011838-01. The content is solely the responsibility of the authors and does not necessarily represent the official views of the National Institutes of Health. We also thank Paolo Ciccarese and Tim Clark for their advice on the development of the PDDI annotation plugin for DOMEO.</p>
        </ack>
        <fn-group>
            <fn fn-type="conflict">
                <p>None declared.</p>
            </fn>
        </fn-group>
        <ref-list>
            <ref id="ref1">
                <label>1</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Magro</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Moretti</surname>
                            <given-names>U</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Leone</surname>
                            <given-names>R</given-names>
                        </name>
                    </person-group>
                    <article-title>Epidemiology and characteristics of adverse drug reactions caused by drug-drug interactions</article-title>
                    <source>Expert Opin Drug Saf</source>
                    <year>2012</year>
                    <month>01</month>
                    <volume>11</volume>
                    <issue>1</issue>
                    <fpage>83</fpage>
                    <lpage>94</lpage>
                    <pub-id pub-id-type="doi">10.1517/14740338.2012.631910</pub-id>
                    <pub-id pub-id-type="medline">22022824</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hansten</surname>
                            <given-names>PD</given-names>
                        </name>
                    </person-group>
                    <article-title>Drug interaction management</article-title>
                    <source>Pharm World Sci</source>
                    <year>2003</year>
                    <month>06</month>
                    <volume>25</volume>
                    <issue>3</issue>
                    <fpage>94</fpage>
                    <lpage>97</lpage>
                    <pub-id pub-id-type="medline">12840961</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Dal-R&#233;</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pedromingo</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Garc&#237;a-Losa</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lahuerta</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ortega</surname>
                            <given-names>R</given-names>
                        </name>
                    </person-group>
                    <article-title>Are results from pharmaceutical-company-sponsored studies available to the public?</article-title>
                    <source>Eur J Clin Pharmacol</source>
                    <year>2010</year>
                    <month>11</month>
                    <volume>66</volume>
                    <issue>11</issue>
                    <fpage>1081</fpage>
                    <lpage>1089</lpage>
                    <pub-id pub-id-type="doi">10.1007/s00228-010-0898-y</pub-id>
                    <pub-id pub-id-type="medline">20844869</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <nlm-citation citation-type="web">
                    <source>Code of Federal Regulations Title 21</source>
                    <access-date>2015-06-10</access-date>
                    <publisher-loc>Washington DC</publisher-loc>
                    <publisher-name>US Food and Drug Administration</publisher-name>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.accessdata.fda.gov/scripts/cdrh/cfdocs/cfcfr/CFRSearch.cfm?fr=201.57">http://www.accessdata.fda.gov/scripts/cdrh/cfdocs/cfcfr/CFRSearch.cfm?fr=201.57</ext-link>
                        <ext-link ext-link-type="webcite" xlink:href="6ZBdCKzvJ" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <nlm-citation citation-type="web">
                    <source>Guidance for industry: indexing structured product labeling</source>
                    <access-date>2015-11-25</access-date>
                    <publisher-loc>Washington DC</publisher-loc>
                    <publisher-name>US Food and Drug Administration</publisher-name>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.fda.gov/downloads/Drugs/GuidanceComplianceRegulatoryInformation/Guidances/ucm072317.pdf">http://www.fda.gov/downloads/Drugs/GuidanceComplianceRegulatoryInformation/Guidances/ucm072317.pdf</ext-link>
                        <ext-link ext-link-type="webcite" xlink:href="6dJGbbaTV" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hines</surname>
                            <given-names>LE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ceron-Cabrera</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Romero</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Anthony</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Woosley</surname>
                            <given-names>RL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Armstrong</surname>
                            <given-names>EP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Malone</surname>
                            <given-names>DC</given-names>
                        </name>
                    </person-group>
                    <article-title>Evaluation of warfarin drug interaction listings in US product information for warfarin and interacting drugs</article-title>
                    <source>Clin Ther</source>
                    <year>2011</year>
                    <month>01</month>
                    <volume>33</volume>
                    <issue>1</issue>
                    <fpage>36</fpage>
                    <lpage>45</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.clinthera.2011.01.021</pub-id>
                    <pub-id pub-id-type="medline">21397772</pub-id>
                    <pub-id pub-id-type="pii">S0149-2918(11)00068-3</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Pfistermeister</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sa&#223;</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Criegee-Rieck</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>B&#252;rkle</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Fromm</surname>
                            <given-names>MF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Maas</surname>
                            <given-names>R</given-names>
                        </name>
                    </person-group>
                    <article-title>Inconsistencies and misleading information in officially approved prescribing information from three major drug markets</article-title>
                    <source>Clin Pharmacol Ther</source>
                    <year>2014</year>
                    <month>11</month>
                    <volume>96</volume>
                    <issue>5</issue>
                    <fpage>616</fpage>
                    <lpage>624</lpage>
                    <pub-id pub-id-type="doi">10.1038/clpt.2014.156</pub-id>
                    <pub-id pub-id-type="medline">25062063</pub-id>
                    <pub-id pub-id-type="pii">clpt2014156</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ayvaz</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Horn</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hassanzadeh</surname>
                            <given-names>O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zhu</surname>
                            <given-names>Q</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Stan</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tatonetti</surname>
                            <given-names>NP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Vilar</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brochhausen</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Samwald</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rastegar-Mojarad</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dumontier</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Boyce</surname>
                            <given-names>RD</given-names>
                        </name>
                    </person-group>
                    <article-title>Toward a complete dataset of drug-drug interaction information from publicly available sources</article-title>
                    <source>J Biomed Inform</source>
                    <year>2015</year>
                    <month>06</month>
                    <volume>55</volume>
                    <fpage>206</fpage>
                    <lpage>217</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://linkinghub.elsevier.com/retrieve/pii/S1532-0464(15)00073-8" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1016/j.jbi.2015.04.006</pub-id>
                    <pub-id pub-id-type="medline">25917055</pub-id>
                    <pub-id pub-id-type="pii">S1532-0464(15)00073-8</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4464899</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Marshall</surname>
                            <given-names>MS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Boyce</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Deus</surname>
                            <given-names>HF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zhao</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Willighagen</surname>
                            <given-names>EL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Samwald</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pichler</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hajagos</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Prud&#8217;hommeaux</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Stephens</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>Emerging practices for mapping and linking life sciences data using RDF: a case series</article-title>
                    <source>Web Semantics: Science, Services and Agents on the World Wide Web</source>
                    <year>2012</year>
                    <month>07</month>
                    <volume>14</volume>
                    <issue>4</issue>
                    <fpage>2</fpage>
                    <lpage>13</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.websem.2012.02.003</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Boyce</surname>
                            <given-names>RD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Horn</surname>
                            <given-names>JR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hassanzadeh</surname>
                            <given-names>O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Waard</surname>
                            <given-names>AD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schneider</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Luciano</surname>
                            <given-names>JS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rastegar-Mojarad</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Liakata</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Dynamic enhancement of drug product labels to support drug safety, efficacy, and effectiveness</article-title>
                    <source>J Biomed Semantics</source>
                    <year>2013</year>
                    <volume>4</volume>
                    <issue>1</issue>
                    <fpage>5</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jbiomedsem.biomedcentral.com/articles/10.1186/2041-1480-4-5" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1186/2041-1480-4-5</pub-id>
                    <pub-id pub-id-type="medline">23351881</pub-id>
                    <pub-id pub-id-type="pii">2041-1480-4-5</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3698101</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Brown</surname>
                            <given-names>SH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Elkin</surname>
                            <given-names>PL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rosenbloom</surname>
                            <given-names>ST</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Husser</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bauer</surname>
                            <given-names>BA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lincoln</surname>
                            <given-names>MJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Carter</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Erlbaum</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tuttle</surname>
                            <given-names>MS</given-names>
                        </name>
                    </person-group>
                    <article-title>VA National Drug File Reference Terminology: a cross-institutional content coverage study</article-title>
                    <source>Stud Health Technol Inform</source>
                    <year>2004</year>
                    <volume>107</volume>
                    <issue>Pt 1</issue>
                    <fpage>477</fpage>
                    <lpage>481</lpage>
                    <pub-id pub-id-type="medline">15360858</pub-id>
                    <pub-id pub-id-type="pii">D040004553</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Olvey</surname>
                            <given-names>EL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Clauschee</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Malone</surname>
                            <given-names>DC</given-names>
                        </name>
                    </person-group>
                    <article-title>Comparison of critical drug-drug interaction listings: the Department of Veterans Affairs medical system and standard reference compendia</article-title>
                    <source>Clin Pharmacol Ther</source>
                    <year>2010</year>
                    <month>01</month>
                    <volume>87</volume>
                    <issue>1</issue>
                    <fpage>48</fpage>
                    <lpage>51</lpage>
                    <pub-id pub-id-type="doi">10.1038/clpt.2009.198</pub-id>
                    <pub-id pub-id-type="medline">19890252</pub-id>
                    <pub-id pub-id-type="pii">clpt2009198</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bui</surname>
                            <given-names>Q</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sloot</surname>
                            <given-names>PM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>van Mulligen</surname>
                            <given-names>EM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kors</surname>
                            <given-names>JA</given-names>
                        </name>
                    </person-group>
                    <article-title>A novel feature-based approach to extract drug-drug interactions from biomedical text</article-title>
                    <source>Bioinformatics</source>
                    <year>2014</year>
                    <month>12</month>
                    <day>01</day>
                    <volume>30</volume>
                    <issue>23</issue>
                    <fpage>3365</fpage>
                    <lpage>3371</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bioinformatics.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=25143286" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1093/bioinformatics/btu557</pub-id>
                    <pub-id pub-id-type="medline">25143286</pub-id>
                    <pub-id pub-id-type="pii">btu557</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref14">
                <label>14</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Boyce</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gardner</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Harkema</surname>
                            <given-names>H</given-names>
                        </name>
                    </person-group>
                    <article-title>Using natural language processing to identify pharmacokinetic drug-drug interactions described in drug package inserts</article-title>
                    <year>2012</year>
                    <month>05</month>
                    <day>07</day>
                    <conf-name>Proceedings of the 2012 Workshop on Biomedical Natural Language Processing</conf-name>
                    <conf-date>2012</conf-date>
                    <conf-loc>Montreal, Quebec, Canada</conf-loc>
                    <fpage>206</fpage>
                    <lpage>213</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://dl.acm.org/citation.cfm?id=2391151" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref15">
                <label>15</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Rzhetsky</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Shatkay</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wilbur</surname>
                            <given-names>WJ</given-names>
                        </name>
                    </person-group>
                    <article-title>How to get the most out of your curation effort</article-title>
                    <source>PLoS Comput Biol</source>
                    <year>2009</year>
                    <month>05</month>
                    <volume>5</volume>
                    <issue>5</issue>
                    <fpage>e1000391</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1000391" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1371/journal.pcbi.1000391</pub-id>
                    <pub-id pub-id-type="medline">19461884</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2678295</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref16">
                <label>16</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Good</surname>
                            <given-names>BM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Su</surname>
                            <given-names>AI</given-names>
                        </name>
                    </person-group>
                    <article-title>Crowdsourcing for bioinformatics</article-title>
                    <source>Bioinformatics</source>
                    <year>2013</year>
                    <month>08</month>
                    <day>15</day>
                    <volume>29</volume>
                    <issue>16</issue>
                    <fpage>1925</fpage>
                    <lpage>1933</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bioinformatics.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=23782614" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1093/bioinformatics/btt333</pub-id>
                    <pub-id pub-id-type="medline">23782614</pub-id>
                    <pub-id pub-id-type="pii">btt333</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3722523</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref17">
                <label>17</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>MacLean</surname>
                            <given-names>DL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Heer</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Identifying medical terms in patient-authored text: a crowdsourcing-based approach</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2013</year>
                    <volume>20</volume>
                    <issue>6</issue>
                    <fpage>1120</fpage>
                    <lpage>1127</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=23645553" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1136/amiajnl-2012-001110</pub-id>
                    <pub-id pub-id-type="medline">23645553</pub-id>
                    <pub-id pub-id-type="pii">amiajnl-2012-001110</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3822103</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref18">
                <label>18</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Khare</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Good</surname>
                            <given-names>BM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Leaman</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Su</surname>
                            <given-names>AI</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lu</surname>
                            <given-names>Z</given-names>
                        </name>
                    </person-group>
                    <article-title>Crowdsourcing in biomedicine: challenges and opportunities</article-title>
                    <source>Brief Bioinform</source>
                    <year>2016</year>
                    <month>01</month>
                    <volume>17</volume>
                    <issue>1</issue>
                    <fpage>23</fpage>
                    <lpage>32</lpage>
                    <pub-id pub-id-type="doi">10.1093/bib/bbv021</pub-id>
                    <pub-id pub-id-type="medline">25888696</pub-id>
                    <pub-id pub-id-type="pii">bbv021</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4719068</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref19">
                <label>19</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Uzuner</surname>
                            <given-names>O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Solti</surname>
                            <given-names>I</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Xia</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cadag</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>Community annotation experiment for ground truth generation for the i2b2 medication challenge</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2010</year>
                    <volume>17</volume>
                    <issue>5</issue>
                    <fpage>519</fpage>
                    <lpage>523</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=20819855" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1136/jamia.2010.004200</pub-id>
                    <pub-id pub-id-type="medline">20819855</pub-id>
                    <pub-id pub-id-type="pii">17/5/519</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2995684</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref20">
                <label>20</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Burger</surname>
                            <given-names>JD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Doughty</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Khare</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wei</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mishra</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Aberdeen</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tresner-Kirsch</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wellner</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kann</surname>
                            <given-names>MG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lu</surname>
                            <given-names>Z</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hirschman</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Hybrid curation of gene-mutation relations combining automated extraction and crowdsourcing</article-title>
                    <source>Database (Oxford)</source>
                    <year>2014</year>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.database.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=25246425" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1093/database/bau094</pub-id>
                    <pub-id pub-id-type="medline">25246425</pub-id>
                    <pub-id pub-id-type="pii">bau094</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4170591</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref21">
                <label>21</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Zhai</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lingren</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Deleger</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>Q</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kaiser</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Stoutenborough</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Solti</surname>
                            <given-names>I</given-names>
                        </name>
                    </person-group>
                    <article-title>Web 2.0-based crowdsourcing for high-quality gold standard development in clinical natural language processing</article-title>
                    <source>J Med Internet Res</source>
                    <year>2013</year>
                    <volume>15</volume>
                    <issue>4</issue>
                    <fpage>e73</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2013/4/e73/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.2426</pub-id>
                    <pub-id pub-id-type="medline">23548263</pub-id>
                    <pub-id pub-id-type="pii">v15i4e73</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3636329</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref22">
                <label>22</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Khare</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Burger</surname>
                            <given-names>JD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Aberdeen</surname>
                            <given-names>JS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tresner-Kirsch</surname>
                            <given-names>DW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Corrales</surname>
                            <given-names>TJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hirschman</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lu</surname>
                            <given-names>Z</given-names>
                        </name>
                    </person-group>
                    <article-title>Scaling drug indication curation through crowdsourcing</article-title>
                    <source>Database (Oxford)</source>
                    <year>2015</year>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.database.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=25797061" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1093/database/bav016</pub-id>
                    <pub-id pub-id-type="medline">25797061</pub-id>
                    <pub-id pub-id-type="pii">bav016</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4369375</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref23">
                <label>23</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>McCoy</surname>
                            <given-names>AB</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wright</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Krousel-Wood</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Thomas</surname>
                            <given-names>EJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>McCoy</surname>
                            <given-names>JA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sittig</surname>
                            <given-names>DF</given-names>
                        </name>
                    </person-group>
                    <article-title>Validation of a Crowdsourcing Methodology for Developing a Knowledge Base of Related Problem-Medication Pairs</article-title>
                    <source>Appl Clin Inform</source>
                    <year>2015</year>
                    <volume>6</volume>
                    <issue>2</issue>
                    <fpage>334</fpage>
                    <lpage>344</lpage>
                    <pub-id pub-id-type="doi">10.4338/ACI-2015-01-RA-0010</pub-id>
                    <pub-id pub-id-type="medline">26171079</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4493334</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref24">
                <label>24</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>McCoy</surname>
                            <given-names>AB</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wright</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Laxmisan</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ottosen</surname>
                            <given-names>MJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>McCoy</surname>
                            <given-names>JA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Butten</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sittig</surname>
                            <given-names>DF</given-names>
                        </name>
                    </person-group>
                    <article-title>Development and evaluation of a crowdsourcing methodology for knowledge base construction: identifying relationships between clinical problems and medications</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2012</year>
                    <volume>19</volume>
                    <issue>5</issue>
                    <fpage>713</fpage>
                    <lpage>718</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=22582202" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1136/amiajnl-2012-000852</pub-id>
                    <pub-id pub-id-type="medline">22582202</pub-id>
                    <pub-id pub-id-type="pii">amiajnl-2012-000852</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3422843</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref25">
                <label>25</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Vreeman</surname>
                            <given-names>DJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hook</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dixon</surname>
                            <given-names>BE</given-names>
                        </name>
                    </person-group>
                    <article-title>Learning from the crowd while mapping to LOINC</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2015</year>
                    <month>11</month>
                    <volume>22</volume>
                    <issue>6</issue>
                    <fpage>1205</fpage>
                    <lpage>1211</lpage>
                    <pub-id pub-id-type="doi">10.1093/jamia/ocv098</pub-id>
                    <pub-id pub-id-type="medline">26224334</pub-id>
                    <pub-id pub-id-type="pii">ocv098</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref26">
                <label>26</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Dixon</surname>
                            <given-names>BE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hook</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Vreeman</surname>
                            <given-names>DJ</given-names>
                        </name>
                    </person-group>
                    <article-title>Learning from the crowd in terminology mapping: the LOINC experience</article-title>
                    <source>Lab Med</source>
                    <year>2015</year>
                    <volume>46</volume>
                    <issue>2</issue>
                    <fpage>168</fpage>
                    <lpage>174</lpage>
                    <pub-id pub-id-type="doi">10.1309/LMWJ730SVKTUBAOJ</pub-id>
                    <pub-id pub-id-type="medline">25918199</pub-id>
                    <pub-id pub-id-type="pii">46/2/168</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref27">
                <label>27</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hanauer</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Aberdeen</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bayer</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wellner</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Clark</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zheng</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hirschman</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Bootstrapping a de-identification system for narrative patient records: cost-performance tradeoffs</article-title>
                    <source>Int J Med Inform</source>
                    <year>2013</year>
                    <month>09</month>
                    <volume>82</volume>
                    <issue>9</issue>
                    <fpage>821</fpage>
                    <lpage>831</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2013.03.005</pub-id>
                    <pub-id pub-id-type="medline">23643147</pub-id>
                    <pub-id pub-id-type="pii">S1386-5056(13)00063-4</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref28">
                <label>28</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Gobbel</surname>
                            <given-names>GT</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Garvin</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Reeves</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cronin</surname>
                            <given-names>RM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Heavirland</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Williams</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Weaver</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jayaramaraja</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Giuse</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Speroff</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brown</surname>
                            <given-names>SH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Xu</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Matheny</surname>
                            <given-names>ME</given-names>
                        </name>
                    </person-group>
                    <article-title>Assisted annotation of medical free text using RapTAT</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2014</year>
                    <volume>21</volume>
                    <issue>5</issue>
                    <fpage>833</fpage>
                    <lpage>841</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=24431336" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1136/amiajnl-2013-002255</pub-id>
                    <pub-id pub-id-type="medline">24431336</pub-id>
                    <pub-id pub-id-type="pii">amiajnl-2013-002255</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4147611</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref29">
                <label>29</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lingren</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Deleger</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Molnar</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zhai</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Meinzen-Derr</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kaiser</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Stoutenborough</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>Q</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Solti</surname>
                            <given-names>I</given-names>
                        </name>
                    </person-group>
                    <article-title>Evaluating the impact of pre-annotation on annotation speed and potential bias: natural language processing gold standard development for clinical named entity recognition in clinical trial announcements</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2014</year>
                    <volume>21</volume>
                    <issue>3</issue>
                    <fpage>406</fpage>
                    <lpage>413</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=24001514" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1136/amiajnl-2013-001837</pub-id>
                    <pub-id pub-id-type="medline">24001514</pub-id>
                    <pub-id pub-id-type="pii">amiajnl-2013-001837</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3994857</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref30">
                <label>30</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Fort</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sagot</surname>
                            <given-names>B</given-names>
                        </name>
                    </person-group>
                    <article-title>Influence of pre-annotation on POS-tagged corpus development</article-title>
                    <year>2010</year>
                    <conf-name>Proceedings of the Fourth Linguistic Annotation Workshop</conf-name>
                    <conf-date>July 15, 2010</conf-date>
                    <conf-loc>Uppsala, Sweden</conf-loc>
                    <fpage>56</fpage>
                    <lpage>63</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.aclweb.org/anthology/W10-1807" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref31">
                <label>31</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>South</surname>
                            <given-names>BR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mowery</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Suo</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Leng</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ferr&#225;ndez</surname>
                            <given-names>&#211;</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Meystre</surname>
                            <given-names>SM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chapman</surname>
                            <given-names>WW</given-names>
                        </name>
                    </person-group>
                    <article-title>Evaluating the effects of machine pre-annotation and an interactive annotation interface on manual de-identification of clinical text</article-title>
                    <source>J Biomed Inform</source>
                    <year>2014</year>
                    <month>08</month>
                    <volume>50</volume>
                    <fpage>162</fpage>
                    <lpage>172</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://linkinghub.elsevier.com/retrieve/pii/S1532-0464(14)00119-1" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1016/j.jbi.2014.05.002</pub-id>
                    <pub-id pub-id-type="medline">24859155</pub-id>
                    <pub-id pub-id-type="pii">S1532-0464(14)00119-1</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref32">
                <label>32</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Boyce</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Guzman</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gardner</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <source>SPL Drug Name Entity Recognizer</source>
                    <access-date>2015-06-09</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://github.com/dbmi-pitt/u-of-pitt-SPL-drug-NER">https://github.com/dbmi-pitt/u-of-pitt-SPL-drug-NER</ext-link>
                        <ext-link ext-link-type="webcite" xlink:href="6ZAD5y4tT" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref33">
                <label>33</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Shah</surname>
                            <given-names>NH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bhatia</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jonquet</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rubin</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chiang</surname>
                            <given-names>AP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Musen</surname>
                            <given-names>MA</given-names>
                        </name>
                    </person-group>
                    <article-title>Comparison of concept recognizers for building the Open Biomedical Annotator</article-title>
                    <source>BMC Bioinformatics</source>
                    <year>2009</year>
                    <volume>10 Suppl 9</volume>
                    <fpage>S14</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-10-S9-S14" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1186/1471-2105-10-S9-S14</pub-id>
                    <pub-id pub-id-type="medline">19761568</pub-id>
                    <pub-id pub-id-type="pii">1471-2105-10-S9-S14</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2745685</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref34">
                <label>34</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Miller</surname>
                            <given-names>GA</given-names>
                        </name>
                    </person-group>
                    <article-title>WordNet: a lexical database for English</article-title>
                    <source>Commun. ACM</source>
                    <year>1995</year>
                    <volume>38</volume>
                    <issue>11</issue>
                    <fpage>39</fpage>
                    <lpage>41</lpage>
                    <pub-id pub-id-type="doi">10.1145/219717.219748</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref35">
                <label>35</label>
                <nlm-citation citation-type="web">
                    <source>World Wide Web Consortium (W3C)</source>
                    <access-date>2015-06-11</access-date>
                    <comment>W3C Open Annotation Data Model<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.openannotation.org/spec/core/">http://www.openannotation.org/spec/core/</ext-link>
                        <ext-link ext-link-type="webcite" xlink:href="6ZD4c1fEe" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref36">
                <label>36</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ciccarese</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Shotton</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Peroni</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Clark</surname>
                            <given-names>T</given-names>
                        </name>
                    </person-group>
                    <article-title>CiTO + SWAN: The web semantics of bibliographic records, citations, evidence and discourse relationships</article-title>
                    <source>Semantic Web</source>
                    <year>2012</year>
                    <fpage>1</fpage>
                    <lpage>28</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.semantic-web-journal.net/content/cito-swan-web-semantics-bibliographic-records-citations-evidence-and-discourse-relationships" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref37">
                <label>37</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ciccarese</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ocana</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Garcia Castro</surname>
                            <given-names>LJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Das</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Clark</surname>
                            <given-names>T</given-names>
                        </name>
                    </person-group>
                    <article-title>An open annotation ontology for science on web 3.0</article-title>
                    <source>J Biomed Semantics</source>
                    <year>2011</year>
                    <volume>2 Suppl 2</volume>
                    <fpage>S4</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jbiomedsem.biomedcentral.com/articles/10.1186/2041-1480-2-S2-S4" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1186/2041-1480-2-S2-S4</pub-id>
                    <pub-id pub-id-type="medline">21624159</pub-id>
                    <pub-id pub-id-type="pii">2041-1480-2-S2-S4</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3102893</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref38">
                <label>38</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ning</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hernandez</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hochheiser</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ciccarese</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Boyce</surname>
                            <given-names>R</given-names>
                        </name>
                    </person-group>
                    <source>DOMEO Client Drug-drug Interaction Plugin</source>
                    <access-date>2015-06-10</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://github.com/rkboyce/DomeoClient">https://github.com/rkboyce/DomeoClient</ext-link>
                        <ext-link ext-link-type="webcite" xlink:href="6ZBq8SVE0" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref39">
                <label>39</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lazar</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Feng</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hochheiser</surname>
                            <given-names>H</given-names>
                        </name>
                    </person-group>
                    <source>Research Methods in Human-Computer Interaction</source>
                    <year>2009</year>
                    <publisher-loc>London</publisher-loc>
                    <publisher-name>Wiley</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref40">
                <label>40</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Downs</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Holbrook</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sheng</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cranor</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Are your participants gaming the system? Screening Mechanical Turk workers</article-title>
                    <year>2010</year>
                    <conf-name>Proceedings of the SIGCHI Conference on Human Factors in Computing Systems</conf-name>
                    <conf-date>April 10-15, 2010</conf-date>
                    <conf-loc>Atlanta, GA</conf-loc>
                    <fpage>2399</fpage>
                    <lpage>2402</lpage>
                    <pub-id pub-id-type="doi">10.1145/1753326.1753688</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref41">
                <label>41</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mitra</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hutto</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gilbert</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>Comparing person- and process-centric strategies for obtaining quality data on Amazon Mechanical Turk</article-title>
                    <year>2015</year>
                    <conf-name>Proceedings of the 33rd Annual ACM Conference on Human Factors in Computing Systems</conf-name>
                    <conf-date>2015</conf-date>
                    <conf-loc>Seoul, Republic of Korea</conf-loc>
                    <fpage>1345</fpage>
                    <lpage>1354</lpage>
                    <pub-id pub-id-type="doi">10.1145/2702123.2702553</pub-id>
                </nlm-citation>
            </ref>
        </ref-list>
    </back>
</article>