<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">ResProt</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Res Protoc</journal-id>
      <journal-title>JMIR Research Protocols</journal-title>
      <issn pub-type="epub">1929-0748</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i5e11448</article-id>
      <article-id pub-id-type="pmid">31066711</article-id>
      <article-id pub-id-type="doi">10.2196/11448</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Protocol</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Protocol</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>The Adverse Drug Reactions From Patient Reports in Social Media Project: Protocol for an Evaluation Against a Gold Standard</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Kuter</surname>
            <given-names>Nicola</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Kass-Hout</surname>
            <given-names>Taha</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Cossin</surname>
            <given-names>Sébastien</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="author" id="contrib1">
          <name name-style="western">
            <surname>Arnoux-Guenegou</surname>
            <given-names>Armelle</given-names>
          </name>
          <degrees>MSc, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3427-7086</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib2">
          <name name-style="western">
            <surname>Girardeau</surname>
            <given-names>Yannick</given-names>
          </name>
          <degrees>MSc, MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3980-0104</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib3" corresp="yes">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Xiaoyi</given-names>
          </name>
          <degrees>MSc, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>INSERM U1138 - Team 22</institution>
            <institution>Information Sciences to Support Personalized Medicine</institution>
            <institution>Centre de Recherche des Cordeliers</institution>
            <addr-line>15 Rue de l'école de Médecine</addr-line>
            <addr-line>Esc D, 1e étage</addr-line>
            <addr-line>Paris, 75006</addr-line>
            <country>France</country>
            <phone>33 71196369</phone>
            <email>chenxiaoyi619@gmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-7378-5158</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib4">
          <name name-style="western">
            <surname>Deldossi</surname>
            <given-names>Myrtille</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-8268-3922</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib5">
          <name name-style="western">
            <surname>Aboukhamis</surname>
            <given-names>Rim</given-names>
          </name>
          <degrees>M Pharm</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3066-0125</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib6">
          <name name-style="western">
            <surname>Faviez</surname>
            <given-names>Carole</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-1500-0236</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib7">
          <name name-style="western">
            <surname>Dahamna</surname>
            <given-names>Badisse</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-0762-2518</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib8">
          <name name-style="western">
            <surname>Karapetiantz</surname>
            <given-names>Pierre</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-6486-9838</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib9">
          <name name-style="western">
            <surname>Guillemin-Lanne</surname>
            <given-names>Sylvie</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3528-2514</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib10">
          <name name-style="western">
            <surname>Lillo-Le Louët</surname>
            <given-names>Agnès</given-names>
          </name>
          <degrees>MD, Prof Dr</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-8135-7340</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib11">
          <name name-style="western">
            <surname>Texier</surname>
            <given-names>Nathalie</given-names>
          </name>
          <degrees>M Pharm</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3749-254X</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib12">
          <name name-style="western">
            <surname>Burgun</surname>
            <given-names>Anita</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-6855-4366</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib13">
          <name name-style="western">
            <surname>Katsahian</surname>
            <given-names>Sandrine</given-names>
          </name>
          <degrees>MD, PhD, Prof Dr</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff7" ref-type="aff">7</xref>
          <xref rid="aff8" ref-type="aff">8</xref>
          <xref rid="aff9" ref-type="aff">9</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-7261-0671</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
      <label>1</label>
      <institution>INSERM U1138 - Team 22</institution>
      <institution>Information Sciences to Support Personalized Medicine</institution>  
      <institution>Centre de Recherche des Cordeliers</institution>  
      <addr-line>Paris</addr-line>
      <country>France</country></aff>
      <aff id="aff2">
      <label>2</label>
      <institution>Département d'Informatique Médicale</institution>
      <institution>Hôpital Européen Georges-Pompidou</institution>  
      <institution>Assistance Publique - Hôpitaux de Paris</institution>  
      <addr-line>Paris</addr-line>
      <country>France</country></aff>
      <aff id="aff3">
      <label>3</label>
      <institution>Innovative Projects - Text Mining</institution>
      <institution>Expert System</institution>  
      <addr-line>Paris</addr-line>
      <country>France</country></aff>
      <aff id="aff4">
      <label>4</label>
      <institution>Centre Régional de Pharmacovigilance</institution>
      <institution>Hôpital Européen Georges-Pompidou</institution>  
      <institution>Assistance Publique - Hôpitaux de Paris</institution>  
      <addr-line>Paris</addr-line>
      <country>France</country></aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Kappa Santé</institution>
        <addr-line>Paris</addr-line>
        <country>France</country>
      </aff>
      <aff id="aff6">
      <label>6</label>
      <institution>Service d'Informatique Biomédicale, D2IM</institution>
      <institution>Centre Hospitalier Universitaire de Rouen</institution>  
      <addr-line>Rouen</addr-line>
      <country>France</country></aff>
      <aff id="aff7">
      <label>7</label>
      <institution>INSERM U1138 - Team 22</institution>
      <institution>Information Sciences to Support Personalized Medicine</institution>  
      <institution>Paris Descartes University, Sorbonne Paris Cité</institution>  
      <addr-line>Paris</addr-line>
      <country>France</country></aff>
      <aff id="aff8">
      <label>8</label>
      <institution>Clinical Research Unit Hôpitaux Universitaires Paris Ouest</institution>
      <institution>Hôpital Européen Georges-Pompidou</institution>  
      <institution>Assistance Publique - Hôpitaux de Paris</institution>  
      <addr-line>Paris</addr-line>
      <country>France</country></aff>
      <aff id="aff9">
      <label>9</label>
      <institution>INSERM CIC1418</institution>
      <institution>Clinical Epidemiology</institution>  
      <institution>Hôpital Européen Georges-Pompidou</institution>  
      <addr-line>Paris</addr-line>
      <country>France</country></aff>
      <author-notes>
        <corresp>Corresponding Author: Xiaoyi Chen 
        <email>chenxiaoyi619@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection"><month>05</month><year>2019</year></pub-date>
      <pub-date pub-type="epub">
        <day>07</day>
        <month>05</month>
        <year>2019</year>
      </pub-date>
      <volume>8</volume>
      <issue>5</issue>
      <elocation-id>e11448</elocation-id>
      <!--history from ojs - api-xml-->
      <history>
        <date date-type="received">
          <day>29</day>
          <month>6</month>
          <year>2018</year>
        </date>
        <date date-type="rev-request">
          <day>1</day>
          <month>8</month>
          <year>2018</year>
        </date>
        <date date-type="rev-recd">
          <day>16</day>
          <month>11</month>
          <year>2018</year>
        </date>
        <date date-type="accepted">
          <day>21</day>
          <month>12</month>
          <year>2018</year>
        </date>
      </history>
      <copyright-statement>©Armelle Arnoux-Guenegou, Yannick Girardeau, Xiaoyi Chen, Myrtille Deldossi, Rim Aboukhamis, Carole Faviez, Badisse Dahamna, Pierre Karapetiantz, Sylvie Guillemin-Lanne, Agnès Lillo-Le Louët, Nathalie Texier, Anita Burgun, Sandrine Katsahian. Originally published in JMIR Research Protocols (http://www.researchprotocols.org), 07.05.2019.</copyright-statement>
      <copyright-year>2019</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Research Protocols, is properly cited. The complete bibliographic information, a link to the original publication on http://www.researchprotocols.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://www.researchprotocols.org/2019/5/e11448/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Social media is a potential source of information on postmarketing drug safety surveillance that still remains unexploited nowadays. Information technology solutions aiming at extracting adverse reactions (ADRs) from posts on health forums require a rigorous evaluation methodology if their results are to be used to make decisions. First, a gold standard, consisting of manual annotations of the ADR by human experts from the corpus extracted from social media, must be implemented and its quality must be assessed. Second, as for clinical research protocols, the sample size must rely on statistical arguments. Finally, the extraction methods must target the relation between the drug and the disease (which might be either treated or caused by the drug) rather than simple co-occurrences in the posts.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We propose a standardized protocol for the evaluation of a software extracting ADRs from the messages on health forums. The study is conducted as part of the Adverse Drug Reactions from Patient Reports in Social Media project.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Messages from French health forums were extracted. Entity recognition was based on <italic>Racine Pharma</italic> lexicon for drugs and Medical Dictionary for Regulatory Activities terminology for potential adverse events (AEs). Natural language processing–based techniques automated the ADR information extraction (relation between the drug and AE entities). The corpus of evaluation was a random sample of the messages containing drugs and/or AE concepts corresponding to recent pharmacovigilance alerts. A total of 2 persons experienced in medical terminology manually annotated the corpus, thus creating the gold standard, according to an annotator guideline. We will evaluate our tool against the gold standard with recall, precision, and f-measure. Interannotator agreement, reflecting gold standard quality, will be evaluated with hierarchical kappa. Granularities in the terminologies will be further explored.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Necessary and sufficient sample size was calculated to ensure statistical confidence in the assessed results. As we expected a global recall of 0.5, we needed at least 384 identified ADR concepts to obtain a 95% CI with a total width of 0.10 around 0.5. The automated ADR information extraction in the corpus for evaluation is already finished. The 2 annotators already completed the annotation process. The analysis of the performance of the ADR information extraction module as compared with gold standard is ongoing.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This protocol is based on the standardized statistical methods from clinical research to create the corpus, thus ensuring the necessary statistical power of the assessed results. Such evaluation methodology is required to make the ADR information extraction software useful for postmarketing drug safety surveillance.</p>
        </sec>
        <sec sec-type="registered-report">
          <title>International Registered Report Identifier (IRRID)</title>
          <p>RR1-10.2196/11448</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>social media</kwd>
        <kwd>drug-related side effects and adverse reactions</kwd>
        <kwd>natural language processing</kwd>
        <kwd>data mining</kwd>
        <kwd>MedDRA</kwd>
        <kwd>Racine Pharma</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>The detection of new adverse drug reactions (ADRs) has been based on postmarketing surveillance by government agencies (national authorities) derived from spontaneous reporting by health care professionals and patients. The US Food and Drug Administration (FDA) and the European Medicines Agency collect ADR case reports through the FDA’s Adverse Event Reporting System (FAERS) [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref4">4</xref>] and the EudraVigilance system, respectively. These systems are useful tools for drug agencies, which mine these huge amounts of structured data to look for new safety concerns that might be related to a marketed product [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref8">8</xref>].</p>
        <p>In the last 20 years, internet and social media have become an integral part of people’s daily life. Social media is now often used to communicate with other persons having the same health concerns and share information regarding their health conditions, feelings, medications, and many other aspects [<xref ref-type="bibr" rid="ref9">9</xref>]. Social media is, therefore, a potential provider of information on ADRs. In 2005, the International Society of Drug Bulletins already recognized such a use: <italic>Patient reporting systems should periodically sample and evaluate the scattered drug experiences patients report on the internet</italic> [<xref ref-type="bibr" rid="ref10">10</xref>]. This new source of knowledge captured the interest from health informatics, statistics, and public health researchers. Although in its infancy, related scientific literature increased in the last decade [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>].</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>In this context, the French Ministry of Industry funded and launched the Adverse Drug Reactions from Patient Reports in Social Media (ADR-PRISM) project. The objective of ADR-PRISM was to make available the contents about ADR, informal and embedded in forums and discussions on the Web, to the actors involved in drug safety (drug companies, agencies, and pharmacovigilance experts). In the end, the tool developed in the ADR-PRISM project should generate hypotheses about new or poorly documented adverse events (AEs). To reach its goals, the ADR-PRISM consortium gathers a company developing text mining softwares (Expert System), a company specialized in pharmaco-epidemiology (Kappa Santé), 3 academic research groups providing expertise in medical informatics and statistics (National Institute of Health and Medical Research &amp; Cordeliers Research Centre: umrs 1138 team 22 dedicated to Information Sciences to support Personalized Medicine and Laboratory in Medical Informatics and Knowledge Engineering in e-Health, and Biomedicine informatics, Service Catalogue and Index of French Language medical websites SIBM-CISMeF), 2 experts in pharmacovigilance (regional center of pharmacovigilance), as well as Vidal group that supplies the drug database used in most drug prescription systems in France.</p>
        <p>From a natural language processing (NLP) perspective, we considered ADR as relationships between drug and AE concepts. On the basis of that, the NLP-based Skill Cartridge for pharmacovigilance developed by Expert System for ADR-PRISM includes a relation extraction module based on (named) entity recognition combined with rules and regular expressions. Before applying it to large collections of forum discussions, we designed a protocol to assess the performance of this ADR information extraction module. The objective of this study is to present this protocol.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Synopsis</title>
        <p>With the objective of sharing a methodology that guarantees the confidence in the results in ADR-PRISM, we followed a way of reasoning inspired by the standards widely adopted in clinical research such as the Standards for Reporting Diagnostic Accuracy studies [<xref ref-type="bibr" rid="ref14">14</xref>]. These items are displayed in <xref ref-type="boxed-text" rid="box1">Textbox 1</xref>.</p>
        <boxed-text id="box1" position="float">
          <title>Synopsis of the protocol.</title>
          <p>Rationale</p>
          <list list-type="bullet">
            <list-item>
              <p>Nowadays, patients extensively use social media. They report on the adverse events they feel because of their medications (further called adverse drug reaction [ADR]) on health forums. Promising studies exist on the extraction of ADR information from social media with natural language processing (NLP) or machine learning tools.</p>
            </list-item>
            <list-item>
              <p>The consortium Adverse Drug Reaction from Patient Reports in Social Media (ADR-PRISM) has been constituted to create a tool extracting the ADR information from social media. Teams specialized in text mining NLP and pharmacovigilance participate in the consortium.</p>
            </list-item>
            <list-item>
              <p>Before applying the ADR-PRISM’s tool on a larger scale (millions of posts) to draw conclusions on ADRs, our goal was to adapt the principles adopted in clinical research to assess the ADR-PRISM. For example, evaluation was done against a gold standard based on manual annotation of the posts.</p>
            </list-item>
          </list>
          <p>Primary objective</p>
          <list list-type="bullet">
            <list-item>
              <p>To estimate robustly the performance of the ADR information extraction tool against gold standard.</p>
            </list-item>
          </list>
          <p>Primary expected results</p>
          <list list-type="bullet">
            <list-item>
              <p>Precision, recall, and f-measure for ADR extraction.</p>
            </list-item>
          </list>
          <p>Secondary objectives</p>
          <list list-type="bullet">
            <list-item>
              <p>To verify the quality of the gold standard and to evaluate the impact of various conditions (eg, different granularities and sentence constraint of the tool) on the performance of the ADR information extraction tool.</p>
            </list-item>
          </list>
          <p>Secondary expected results</p>
          <list list-type="bullet">
            <list-item>
              <p>Kappa metrics for interannotator agreement; and precision, recall, and f-measure for ADR extraction in various conditions.</p>
            </list-item>
          </list>
          <p>Database</p>
          <list list-type="bullet">
            <list-item>
              <p>Posts from the Kappa Santé Detec’t database published between January 1, 2007, and October 28, 2016.</p>
            </list-item>
          </list>
          <p>Eligibility criteria</p>
          <list list-type="bullet">
            <list-item>
              <p>Posts from the Kappa Santé Detec’t database that contain at least one drug’s or molecule’s (active substance) name, and posts randomly selected from the rest of the Kappa Santé Detec’t database; a list of drugs and adverse events (AEs) of interest is established by drug safety experts; and ADR: any explicit and positive relationship between a drug and a potential AE where either the drug or the AE or both belong to the list.</p>
            </list-item>
          </list>
          <p>Index test method</p>
          <list list-type="bullet">
            <list-item>
              <p>ADR information extraction tool: this tool classifies each co-occurrence of drug and AE in a post as positive ADR or negative ADR or no ADR, and maps the drug and the AE expression to <italic>Racine Pharma</italic> and Medical Dictionary for Regulatory Activities (MedDRA), respectively.</p>
            </list-item>
          </list>
          <p>Reference method</p>
          <list list-type="bullet">
            <list-item>
              <p>Gold standard: manual annotations of the co-occurrence of drug and AE as positive ADR or negative ADR or no ADR including the mapping of the drug and the AE expression with a <italic>Racine Pharma</italic> and a MedDRA entity, respectively. Manual annotations will be provided by 2 annotators with experience in medical terminology.</p>
            </list-item>
          </list>
          <p>Sample size</p>
          <list list-type="bullet">
            <list-item>
              <p>A 95% CI, with a total width of 0.1, is used to determine the sample size.</p>
            </list-item>
          </list>
          <p>Statistical analyses</p>
          <list list-type="bullet">
            <list-item>
              <p>Recall, precision, and f-measure calculations for evaluation of the performances of the ADR extraction information tool and interannotator agreement for the evaluation of the gold standard with a Cohen kappa.</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
      <sec>
        <title>Design and Ethics</title>
        <sec>
          <title>Design</title>
          <p>This project is based on retrospective data collected among threads of discussion accessible on social media (messages from French health forums). A total of 2 experts in pharmacovigilance helped delineating the project. The objective is twofold: (1) focus on certain pharmaceutical products of interest and identify the related ADRs and (2) detect the emergence of general potential problem in public health. On this basis, the extraction of ADR information is expected to (1) perform well on specific concepts for use case study and (2) be able to extract all potential concepts correctly for screening purpose.</p>
          <p>To evaluate the ADR information extraction, we therefore build up the global process in 2 phases (<xref ref-type="fig" rid="figure1">Figure 1</xref>). In phase 1, we implemented an iterative process of validation and improvement of the Skill Cartridge for pharmacovigilance. The objectives were (1) to correct the most frequent errors and to train the ADR information extraction module and (2) to estimate the performance indicators and the time required for manual annotation for phase 2 sample size determination. Then, in phase 2, we will conduct a definite assessment of the performance of the ADR information extraction module.</p>
          <p>In the rest of the paper, we use the term <italic>AE</italic> for medical events that are present in text for a potential ADR, whereas the term <italic>ADR</italic> is used when a relation between a drug and an AE is established.</p>
          <fig id="figure1" position="float">
            <label>Figure 1</label>
            <caption>
              <p>Study overview. ADR: adverse drug reaction.</p>
            </caption>
            <graphic xlink:href="resprot_v8i5e11448_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Ethics</title>
          <p>This research did not involve experiment on either humans or animals. Ethics and guarantee of data privacy constituted an integral and dedicated working group set up for the ADR-PRISM project. To comply with national regulations, we first registered data collection to the French Data Protection Agency (CNIL for Commission Nationale Informatique et Liberté), which is known as a <italic>normal notification</italic> in technical terminology, on December 23, 2015. We later submitted an authorization request on March 30, 2016, regarding data analysis and validation of the approach adopted about ethics and confidentiality to the same agency. ADR-PRISM’s consortium detailed approach is explained in the study by Bousquet et al [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
          <p>The ADR-PRISM project was supported by an ethics advisory board, which was composed of scientists with different scientific expertise: drug safety, public health, and ethics. Their role was to give independent advice regarding ethical issues to the project consortium. The board approved the whole study design, including the protocol presented in the paper.</p>
        </sec>
      </sec>
      <sec>
        <title>Adverse Drug Reactions From Patient Reports in Social Media Adverse Drug Reaction Extraction</title>
        <sec>
          <title>Resources</title>
          <p>We used 3 lexicons to represent drug information and AEs. We codified AEs with the Medical Dictionary for Regulatory Activities (MedDRA) v15.1 [<xref ref-type="bibr" rid="ref16">16</xref>] classification. <italic>Racine Pharma</italic>, maintained by the SIBM-CISMeF [<xref ref-type="bibr" rid="ref17">17</xref>], provided an extensive source of drug names that covered all medications available on the French market, including brand names and active ingredients. <italic>Racine Pharma</italic> entries were mapped to the Anatomical Therapeutic Chemical (ATC) system [<xref ref-type="bibr" rid="ref18">18</xref>], which was used as a classification system for drugs.</p>
          <p>The corpus of messages was extracted from the Detec’t database [<xref ref-type="bibr" rid="ref19">19</xref>], a database developed by Kappa Santé that collects messages from several French forums using a Web crawler. We limited ourselves to a list of 5 major health forums in French obtained using netscoring [<xref ref-type="bibr" rid="ref9">9</xref>]. Message extraction was based on a named entity recognition module using a drug lexicon designed by Kappa Santé and a fuzzy matching algorithm. The lexicon was based on <italic>Racine Pharma</italic>, the ATC classification, and a list of medications extracted from the French National Health Insurance database.</p>
        </sec>
      </sec>
      <sec>
        <title>Drugs, Adverse Events, and Adverse Drug Reaction Extraction</title>
        <p>ADR extraction was performed in 2 steps: first, named entity recognition modules were used to identify drug names and AEs in posts, and then, a relation extraction algorithm was applied to these entities (<xref ref-type="fig" rid="figure2">Figure 2</xref>).</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Adverse drug reaction pipeline. ADR: adverse drug reaction; ATC: Anatomical Therapeutic Chemical (in ATC classification); MedDRA: Medical Dictionary for Regulatory Activities.</p>
          </caption>
          <graphic xlink:href="resprot_v8i5e11448_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <sec>
          <title>Drugs and Adverse Events Extraction</title>
          <p>Regarding drugs, Expert System has developed a named entity recognition module capable of identifying words or tokens (occurrences) listed in <italic>Racine Pharma</italic> and extracting their positions from forum posts.</p>
          <p>We mapped the extracted expressions from <italic>Racine Pharma</italic> to the chemical substance level (5th level) of the ATC (last updated version: December 19, 2016) [<xref ref-type="bibr" rid="ref18">18</xref>]. Considering that the same active ingredient could be found under different trade names, we pooled all mapped expressions within the same ATC chemical subgroup (4th level) to define the drug concepts.</p>
          <p>Expert System has developed another module based on MedDRA to identify the AEs and extract their position in the posts. Fuzzy-matching and enrichment of thesaurus with colloquial terms enabled to take into account the characteristics of the posts on health forums.</p>
        </sec>
        <sec>
          <title>Drug and Adverse Event Relationship Extraction (Skill Cartridge for Pharmacovigilance)</title>
          <p>An NLP module has been developed by Expert System to capture the specific information regarding the relationship established between a drug and an AE by the post’s author. The module combined a set of rules and regular expressions, with a <italic>Patient</italic> lexicon constituted to ensure that the post’s author set out a situation of a person taking the drug and experiencing the symptom and excludes general information regarding a drug or an AE. This lexicon contains terms such as <italic>I</italic>, <italic>me</italic>, <italic>my</italic>, <italic>cause</italic>, <italic>test</italic>, <italic>take</italic>, <italic>feeling</italic>, <italic>because of</italic>, <italic>provoke</italic>, <italic>intolerance</italic>, and <italic>allergies</italic>. This NLP module also included negation detection.</p>
          <p>The algorithm can be summarized as follows:</p>
          <list list-type="order">
            <list-item>
              <p>Text was split into sentences based on the punctuation mark.</p>
            </list-item>
            <list-item>
              <p>For each sentence, (named) entity recognition modules extracted drugs and AEs.</p>
            </list-item>
            <list-item>
              <p>For each pair of drug and AE co-occurring in a sentence, if the NLP module extracted specific information regarding a relation, then the co-occurrence was classified as follows:</p>
              <list list-type="bullet">
                <list-item>
                  <p>Explicit and positive ADR (eg, <italic>Abilify causes me such fears that I cannot concentrate to read, work, etc</italic>...);</p>
                </list-item>
                <list-item>
                  <p>Explicit and negative ADR (eg, <italic>I took some Doliprane and I didn’t feel any nausea);</italic></p>
                </list-item>
                <list-item>
                  <p>If no specific information was identified, the co-occurrence was classified as no ADR (eg, <italic>Usually, Focalin’s adverse effects are loss of appetite, insomnia, and naso-pharyngitis</italic>).</p>
                </list-item>
              </list>
            </list-item>
          </list>
        </sec>
      </sec>
      <sec>
        <title>Phase 1: Iterative Improvement of the Adverse Drug Reaction Information Extraction Module</title>
        <p>Phase 1 consisted of an iterative process of validations and improvements of the tool. The review on the corpus was constituted by manual annotation of the messages by 2 experts in pharmacovigilance. The manual annotation process used a tool developed by Expert System for in-house testing purposes [<xref ref-type="bibr" rid="ref20">20</xref>]. This tool did not integrate functionalities for blind manual annotation. No gold standard was established at this step. All along the process, both annotators could see the drugs, AEs, and ADRs extracted by the tool, and their task consisted of validating or invalidating these extractions and, if needed, complementing the annotations performed by the system. The annotators were asked to (1) check all drugs and all AEs in the post, irrespective of whether they have been involved in an ADR relationship, and (2) identify all drug-AE relationships in the same sentence. The output of phase 1 was a first estimation of precision, recall, and f-measure, assessing the capacity to extract information regarding drugs, AEs, and ADRs. More details about the corpus construction, evaluating concept selection, sample size determination, and the preliminary results of this phase were reported in the study by Chen et al [<xref ref-type="bibr" rid="ref21">21</xref>].</p>
      </sec>
      <sec>
        <title>Phase 2: Evaluation</title>
        <sec>
          <title>Corpus for Evaluation</title>
          <sec>
            <title>Evaluation Dataset</title>
            <p>For phase 2, the selection of datasets is given in <xref ref-type="fig" rid="figure3">Figure 3</xref>.</p>
            <p>On October 28, 2016, Kappa Santé Detec’t database contained about 23 millions of posts, and approximately 21 million posts were published after January 1, 2007. Messages about drugs, for which marketing authorization has been withdrawn before the cut-off date, were considered as some AEs might appear at long term or patients might discuss about old drugs and their safety.</p>
            <p>The software developed by Kappa Santé for purpose of Web discussions collection offered the possibility of preidentifying the posts containing at least one pharmaceutical or molecule name. We considered the dataset of all posts containing at least one preidentified compound or brand name and combined it with a complementary set of posts randomly sampled from the remainder of the Kappa Santé Detec’t database.</p>
            <p>The drug, AE, and ADR extraction modules developed for ADR-PRISM were executed on both sets of posts, and the output of the extraction module was considered as the evaluation dataset.</p>
            <fig id="figure3" position="float">
              <label>Figure 3</label>
              <caption>
                <p>Phase 2 messages selection flowchart. ADR: adverse drug reaction; ATC: Anatomical Therapeutic Chemical (in ATC classification); MedDRA: Medical Dictionary for Regulatory Activities.</p>
              </caption>
              <graphic xlink:href="resprot_v8i5e11448_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
            </fig>
          </sec>
          <sec>
            <title>Drug Selection</title>
            <p>The evaluation focused on 3 categories of drugs: (1) the most frequently extracted drugs in the corpus, (2) the most sold drugs in France, and (3) the drugs of interest of pharmacovigilance because of recent safety alerts. For the last 2 categories, the frequencies of the recognized named entities were also taken into account to cope with the necessary sample size.</p>
            <p>The most sold drugs in 2013 in France are listed below, in their French commercial names, including the 10 most sold drugs with <italic>mandatory</italic> medical prescription for dispensation and the 10 most sold drugs with <italic>optional</italic> medical prescription for dispensation [<xref ref-type="bibr" rid="ref22">22</xref>]:</p>
            <list list-type="bullet">
              <list-item>
                <p><italic>Mandatory medical prescription for dispensation:</italic> Levothyrox, Uvedose, Lamaline, Dafalgan codéiné, Méthadone, Crestor, Pivalone, Seresta, Emla patch, and Seroplex</p>
              </list-item>
              <list-item>
                <p><italic>Optional medical prescription for dispensation:</italic> Doliprane, Dafalgan, Efferalgan, Kardégic, Spasfon, Gaviscon, Dexéryl, Météospasmyl, Biseptine, and Eludril.</p>
              </list-item>
            </list>
            <p>The 2 experts additionally worked out a list of pairs of 1 drug concept and 1 AE concept corresponding to alerts that emerged in the last years (<xref ref-type="table" rid="table1">Table 1</xref>). This list of use cases has been further employed as a basis for the concept selection for evaluation. The concept selection in phase 1 (iterative improvement) [<xref ref-type="bibr" rid="ref21">21</xref>] was based on the same consideration; therefore, those concepts on which the extraction tool performed well should be excluded from the selection for evaluation.</p>
            <table-wrap position="float" id="table1">
              <label>Table 1</label>
              <caption>
                <p>List of drug and adverse event concepts selected as pharmacovigilance use cases.</p>
              </caption>
              <table width="1000" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
                <col width="280"/>
                <col width="280"/>
                <col width="280"/>
                <col width="160"/>
                <thead>
                  <tr valign="top">
                    <td>Active drug ingredient: French names (date of marketing in cases where drug has been withdrawn)</td>
                    <td>Adverse events of interest</td>
                    <td>Corresponding Medical Dictionary for Regulatory Activities term</td>
                    <td>Media coverage or alert date</td>
                  </tr>
                </thead>
                <tbody>
                  <tr valign="top">
                    <td>Gardasil</td>
                    <td>Autoimmune disease, complex regional pain syndrome, and postural orthostatic tachycardia syndrome</td>
                    <td>Autoimmune disorders (HLGT<sup>a</sup>) + complex regional pain syndrome (PT<sup>b</sup>) + postural orthostatic tachycardia syndrome (PT)</td>
                    <td>2013</td>
                  </tr>
                  <tr valign="top">
                    <td>Meningitec</td>
                    <td>Quality defect and any adverse event</td>
                    <td>All terms</td>
                    <td>2015</td>
                  </tr>
                  <tr valign="top">
                    <td>Methylphénidate: Ritaline, Concerta, Medikinet, Quasym, and Ritaline</td>
                    <td>Neurological and cardiac effects</td>
                    <td>Cardiac disorders (SOC<sup>c</sup>) + nervous system disorders (SOC)</td>
                    <td>2009 (recommendation)</td>
                  </tr>
                  <tr valign="top">
                    <td>Acétate de cyprotérone: Diane 35, Cypropharm (2010-2013), Elleacnelle (2010-2013), Evepar, Holgyme (2002-2015), Lumalia (2003-2013), Minerva, and Arielle (1997-2011)</td>
                    <td>Thromboembolic risk</td>
                    <td>Embolism and thrombosis (HLGT)</td>
                    <td>2012 (alert)</td>
                  </tr>
                  <tr valign="top">
                    <td>Fluoxétine: Prozac, Elindra (2001-2008), Fluctine (1998-2008), and Fontex (2001-2008)</td>
                    <td>All adverse events</td>
                    <td>All terms</td>
                    <td>Mostly 2013</td>
                  </tr>
                  <tr valign="top">
                    <td>Méthadone</td>
                    <td>Prolonged time from the start of the Q wave to the end of the T wave during electrocardiogram (approximates the time taken from when the cardiac ventricles start to contract to when they finish relaxing)</td>
                    <td>QT interval prolongation</td>
                    <td>2007</td>
                  </tr>
                  <tr valign="top">
                    <td>Sofosbuvir: Harvoni, Epclusa, and Sovaldi</td>
                    <td>Bradycardia</td>
                    <td>Bradycardia (PT)</td>
                    <td>2013</td>
                  </tr>
                  <tr valign="top">
                    <td>Codeine: Codenfan, Codoliporane, Migralgine, and Néocodion et Prontalgine</td>
                    <td>Respiratory disorders</td>
                    <td>Respiratory disorders (HLGT)</td>
                    <td>2012 re-evaluation</td>
                  </tr>
                  <tr valign="top">
                    <td>Hydroxyzine: atarax</td>
                    <td>Rhythm disorders</td>
                    <td>Cardiac arrhythmias (HLGT)</td>
                    <td>2014</td>
                  </tr>
                  <tr valign="top">
                    <td>Nicorandil: Adancor and Ikorel</td>
                    <td>Skin ulceration</td>
                    <td>Skin ulcer (HLT<sup>d</sup>)</td>
                    <td>2012</td>
                  </tr>
                  <tr valign="top">
                    <td>Midodrine: Gutron</td>
                    <td>Hypertension</td>
                    <td>Blood pressure increased (PT)</td>
                    <td>2013</td>
                  </tr>
                  <tr valign="top">
                    <td>Galantamine: Reminyl, Galanthen (2012-2015), and Galema (2011-2015)</td>
                    <td>Skin reaction</td>
                    <td>Skin and subcutaneous tissue disorders (SOC)</td>
                    <td>2014</td>
                  </tr>
                  <tr valign="top">
                    <td>Crizotinib: Xalkori</td>
                    <td>Heart failure</td>
                    <td>Heart failures HLGT</td>
                    <td>2014</td>
                  </tr>
                  <tr valign="top">
                    <td>Valproate de sodium: Depakine, Imaslav, and Micropakine</td>
                    <td>Teratogenic effects</td>
                    <td>Congenital, familial, and genetic disorders (SOC)</td>
                    <td>2012?</td>
                  </tr>
                  <tr valign="top">
                    <td>Isotrétinoine: Curacné, Acnetrait, Contracné, Procuta, and Roaccutane</td>
                    <td>Teratogenic effects + psychiatric disorders</td>
                    <td>Congenital, familial, and genetic disorders (SOC) and psychiatric disorders (SOC)</td>
                    <td>2002</td>
                  </tr>
                  <tr valign="top">
                    <td>Fingolimod: Gilenya</td>
                    <td>Leukoencephalopathy</td>
                    <td>Toxic leukoencephalopathy (PT)</td>
                    <td>2014</td>
                  </tr>
                  <tr valign="top">
                    <td>Aripiprazole: Abilify</td>
                    <td>Suicidal behavior</td>
                    <td>Suicidal and self-injurious behavior (HLGT)</td>
                    <td>2013 (words of warning: 2016)</td>
                  </tr>
                </tbody>
              </table>
              <table-wrap-foot>
                <fn id="table1fn1">
                  <p><sup>a</sup>HLGT: high-level group term.</p>
                </fn>
                <fn id="table1fn2">
                  <p><sup>b</sup>PT: preferred term.</p>
                </fn>
                <fn id="table1fn3">
                  <p><sup>c</sup>SOC: system organ class.</p>
                </fn>
                <fn id="table1fn4">
                  <p><sup>d</sup>HLT: high-level term.</p>
                </fn>
              </table-wrap-foot>
            </table-wrap>
          </sec>
          <sec>
            <title>Adverse Event Concepts Selection</title>
            <p>The AE concepts for evaluation corresponded to preferred term (PT) level in the MedDRA hierarchy, and we focused similarly on 2 categories: (1) the most frequent extracted PTs and (2) the PTs of interest of pharmacovigilance (<xref ref-type="table" rid="table1">Table 1</xref>), guided also by the frequencies of the recognized entities in the corpus to cope with the necessary sample size.</p>
          </sec>
          <sec>
            <title>Adverse Drug Reaction Definition</title>
            <p>We defined an ADR as any explicit and positive relationship between a drug and an AE where the drug (respectively the AE) belonged to the list of concepts previously selected.</p>
          </sec>
          <sec>
            <title>Corpus for the Evaluation (Random Sample From Evaluation Dataset)</title>
            <p>Finally, a random sample from the evaluation dataset (ie, among all the ADR extracted by the ADR information extraction module) constituted our corpus for evaluation.</p>
          </sec>
        </sec>
      </sec>
      <sec>
        <title>Gold Standard</title>
        <sec>
          <title>Adverse Drug Reactions From Patient Reports in Social Media Manual Annotation Platform</title>
          <p>We developed a Web application dedicated to manual annotations valuable as gold standard, for the project purposes in phase 2.</p>
          <p>This application was based on Java Servlets and JavaScript libraries and connected in Java Database Connectivity to the dataset of posts selected for the gold standard annotation. We used a self-completion mechanism to attach portions of message to <italic>Racine Pharma</italic> and MedDRA terms. We used drag-and-drop operations to fill in a table containing the manual review of the co-occurrences, where each line was dedicated to 1 co-occurrence. For each co-occurrence, the drug and the AE were dragged-and-dropped in the first and the second column, respectively. In the third column, the manual annotator was given a drop-down menu that presented 3 possibilities for defining the co-occurrence: explicit positive ADR, explicit negative ADR, or no ADR. We finally offered the possibility to export this table containing the manual annotations obtained via the application. The interface of this application is shown in <xref ref-type="fig" rid="figure4">Figure 4</xref>.</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Interface of the manual annotation platform. ID: identifier; MedDRA: Medical Dictionary for Regulatory Activities.</p>
            </caption>
            <graphic xlink:href="resprot_v8i5e11448_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Gold Standard Construction</title>
          <p>An annotator guideline has been established to standardize manual annotations. A total of 2 experts in medical terminologies have annotated all ADR relationships for each post in the evaluation corpus, and then, the manual annotation was considered as gold standard. Different from phase 1, here we expected that the annotators annotated all causal relationships between a drug and an AE, even if the drug and AE were not in the same sentence, which will allow us further evaluate the impact of the sentence boundary constraint of the extraction tool.</p>
          <p>Each annotator annotated 55.1% (261/474) of the posts in the evaluation corpus; thus, a subset of 10.1% (48/474) of the posts was annotated by both of them. The interannotator agreement could be assessed on these double-annotated posts. In case of disagreements, the 2 annotators discussed to achieve a consensus. If a lot of disagreements had occurred, the annotators would have been asked to learn again the guideline and revise their annotations. All along the process, both annotators were double-blinded: first, from the ADRs identified by the ADR information extraction module, and second, from the other annotator’s annotations.</p>
        </sec>
      </sec>
      <sec>
        <title>Statistical Analyses</title>
        <sec>
          <title>Primary Analysis</title>
          <p>To assess the efficacy of the ADR information extraction module as compared with the gold standard, we will globally calculate the recall, precision, and f-measure.</p>
          <p>In a post, if the ADR information extraction module identifies the same expression from <italic>Racine Pharma</italic> at the same position; <italic>and</italic> the same AE expression at PT level from MedDRA hierarchy at the same position; <italic>and</italic> the same type of relationship, as did the gold standard, then we will count the extracted <italic>ADR</italic> as a true positive (<xref ref-type="fig" rid="figure5">Figure 5</xref>).</p>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>Recall, precision, and f-measure definitions. ADR: adverse drug reaction; ADR-PRISM: Adverse Drug Reaction from Patient Reports in Social Media; FN: false negative, manually annotated ADR by the gold standard that is not extracted by the ADR information extraction tool; FP: false positive, positive explicit relationship extracted by the ADR information extraction tool that is not manually annotated by gold standard; TN: true negative; TP: true positive.</p>
            </caption>
            <graphic xlink:href="resprot_v8i5e11448_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>F-Measure Gold Standard’s Evaluation</title>
          <p>The interannotator agreement will be assessed by a hierarchical Kappa [<xref ref-type="bibr" rid="ref23">23</xref>]. A hierarchical Kappa will enable to take into account the situation where the 2 annotators will disagree in either the level or the expression in ATC or MedDRA terminologies but will agree on higher levels than the annotated ones. Separate calculations for interannotator agreements by hierarchical Kappa on drug and AE expressions will be provided as well.</p>
        </sec>
        <sec>
          <title>Secondary Analyses</title>
          <p>We will complete these principal results with the following analyses.</p>
          <p>We will take into account MedDRA and ATC granularities by reproducing precision, recall, and f-measure at each level of the hierarchies (system organ class [SOC], high-level group term [HLGT], high-level term [HLT], and preferred term [PT] of MedDRA and anatomical main group, therapeutic subgroup, pharmacological subgroup, and chemical subgroup of ATC).</p>
          <p>We will provide a relaxed definition of true-positive ADRs combining the following 3 conditions: (1) the positions in the post of the extracted expressions for drug and AE both match the positions of the drug and AE expressions manually annotated, (2) the extracted and the manually annotated expressions for AE from MedDRA hierarchy are found in the same SOC levels, and (3) the classification of the identified relationship match the classification of the manually annotated relationship. We will calculate recall, precision, and f-measure with this definition for ADRs, drug, and AE identification separately.</p>
          <p>We will provide a global estimation of the performance of ADR information extraction module by taking into account other types of messages. These messages are those without information on at least one ADR concept, that is, messages in which (1) ADR information is extracted but is not concerned by the drug- or AE-selected concepts, (2) no ADR information is extracted but only co-occurrences of information about 1 drug and 1 AE, (3) only AE information is extracted, (4) only drug information is extracted, and (5) neither drug nor AE information is extracted. After having sampled each type of message described above, we will then calculate global recall or precision or f-measure on all types of messages by marginal calibration.</p>
          <p>All analyses will be performed in <italic>R</italic> software [<xref ref-type="bibr" rid="ref24">24</xref>].</p>
        </sec>
      </sec>
      <sec>
        <title>Sample Size Calculation</title>
        <p>Recall can be estimated from a random sample of ADR concepts annotated by the gold standard, whereas precision can be estimated from a random sample of ADR concepts extracted by the ADR information extraction module. However, creating the gold standard on the whole evaluation dataset before sampling in it for the recall was an overwhelming task. At the same time, a vast majority of messages did not contain any information on the drug concept. Thus, we expected a very low proportion of ADR concepts identified by the ADR information extraction module in the evaluation dataset. Therefore, the recall estimated from a random sample of ADR concepts annotated by the gold standard was mathematically approximated by the recall estimated on ADR concepts sampled for the precision.</p>
        <p>The sample size required for different expected precision or recall is provided in <xref ref-type="table" rid="table2">Table 2</xref>. By hypothesizing a global recall of 0.5, we needed at least 384 identified ADR concepts to obtain a 95% CI, having a total width of 0.1. The final determination of sample size was based on the previously estimated precision and recall.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Sample size required according to the expected precision and recall and total width of confidence intervals (CIs).</p>
          </caption>
          <table width="1000" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="190"/>
            <col width="90"/>
            <col width="90"/>
            <col width="90"/>
            <col width="90"/>
            <col width="90"/>
            <col width="90"/>
            <col width="90"/>
            <col width="90"/>
            <col width="90"/>
            <thead>
              <tr valign="top">
                <td>Range of CI</td>
                <td colspan="9">Expected precision or recall values</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>0.1</td>
                <td>0.2</td>
                <td>0.3</td>
                <td>0.4</td>
                <td>0.5</td>
                <td>0.6</td>
                <td>0.7</td>
                <td>0.8</td>
                <td>0.9</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>90% CI</td>
                <td>35</td>
                <td>61</td>
                <td>81</td>
                <td>92</td>
                <td>96</td>
                <td>92</td>
                <td>81</td>
                <td>61</td>
                <td>35</td>
              </tr>
              <tr valign="top">
                <td>95% CI</td>
                <td>138</td>
                <td>246</td>
                <td>323</td>
                <td>369</td>
                <td>384</td>
                <td>369</td>
                <td>323</td>
                <td>246</td>
                <td>138</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Differences Between Phase 1 and Phase 2</title>
        <p>The main differences between phase 1 and phase 2 are threefold (<xref ref-type="table" rid="table3">Table 3</xref>). First, in phase 1, the annotations targeted all drugs and AEs even if not involved in an ADR relation, whereas in phase 2, annotation focuses on the ADR relations. Second, in phase 2 (and only in phase 2) a gold standard based on blind manual annotation by 2 experts in medical terminologies was established and the interannotator agreement was measured. In contrast, the manual annotations of phase 1 were not blind, and most of the work consisted of validating the automatic annotations; thus, the interannotator agreement was not addressed. Finally, in phase 2, additional parameters such as the granularity and the segmentation of the messages (sentence boundaries) will be analyzed. The precision, recall, and f-measure will be calculated with a gold standard at the message level and might be compared with precisions, recalls and f-measures calculated at the sentence level and for all MedDRA and ATC granularities.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Common features and differences between phase 1 and phase 2.</p>
          </caption>
          <table width="1000" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="300"/>
            <col width="350"/>
            <col width="350"/>
            <thead>
              <tr valign="top">
                <td>Issues</td>
                <td>Phase 1</td>
                <td>Phase 2</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Evaluation focus</td>
                <td>Drugs and adverse events entity recognition</td>
                <td>Adverse drug reaction relationships recognition</td>
              </tr>
              <tr valign="top">
                <td>Gold standard (manual annotations)</td>
                <td>Not blind</td>
                <td>Blind</td>
              </tr>
              <tr valign="top">
                <td>Gold standard annotators</td>
                <td>Pharmacovigilance experts</td>
                <td>Experts in medical terminologies</td>
              </tr>
              <tr valign="top">
                <td>Interannotator agreement</td>
                <td>No</td>
                <td>Yes</td>
              </tr>
              <tr valign="top">
                <td>Granularity issue</td>
                <td>No</td>
                <td>Yes</td>
              </tr>
              <tr valign="top">
                <td>Sentence boundary issue</td>
                <td>No</td>
                <td>Yes</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>At the time of publishing this evaluation protocol, several steps of this project would have been completed. The corpus for evaluation has been constituted, and the NLP tools have identified and extracted the information about ADR inside this corpus. We selected the ADR concepts and constituted the samples of the entities necessary to set up the gold standard. The 2 annotators completed the annotations process.</p>
      <p>Data analyses for assessing the interannotator agreement and the performance of the ADR information extraction module as compared with the gold standard are ongoing, and the study results are expected internally before the end of 2018.</p>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Summary</title>
        <p>With the objective of using messages on health forums as a new source for drug safety, the systems developed to mine the messages must follow strict evaluation rules. This is even more important as these systems might be used to support decision making. The protocol presented in this paper has been designed to evaluate the ADR information extraction Skill Cartridge developed in ADR-PRISM in a pharmacovigilance perspective.</p>
      </sec>
      <sec>
        <title>Study Strengths</title>
        <p>The protocol presented in this paper is an attempt to apply clinical research–level guidelines [<xref ref-type="bibr" rid="ref14">14</xref>] to the assessment of such systems.</p>
        <p>First, we paid particular attention to the establishment and the validation of the gold standard. The gold standard was established by 2 trained specialists of medical terminologies who annotated selected messages. Manual annotation was performed in a <italic>double-blind</italic> manner, namely, from both the other annotator and the ADR identified by the ADR information extraction module. The annotated corpus, therefore, constituted a valuable gold standard. On the basis of the study by Sarker et al [<xref ref-type="bibr" rid="ref4">4</xref>] (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>), we could find 13 studies where a gold standard, that is, manual annotations used for evaluation, was implemented [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]. Conversely, in 8 studies, there was no gold standard [<xref ref-type="bibr" rid="ref38">38</xref>-<xref ref-type="bibr" rid="ref45">45</xref>], and the extracted ADRs were compared with already known AEs from FAERS [<xref ref-type="bibr" rid="ref39">39</xref>-<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>] or drug label declared to FDA [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref45">45</xref>] or even AE described in websites [<xref ref-type="bibr" rid="ref42">42</xref>]. Moreover, in the ADR-PRISM protocol, a common subset of randomly selected messages was annotated in a blind manner by the 2 experts; interannotator agreement evaluation will also ensure ourselves about the quality of this gold standard. In most of studies, the authors gauged the interannotators agreement [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. However, it is not systematic [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>].</p>
        <p>Second, by calculating a sample size of messages collected from social media, to assess recall, precision, and f-measure, we guaranteed the statistical power to place reliance on our study results.</p>
        <p>The chosen terminologies are another crucial aspect of this work. On the one hand, the <italic>Racine Pharma</italic> thesaurus, with 5164 entries, exhaustively covers a large range of drug names and active ingredients. On the other hand, the MedDRA hierarchy is used daily by drug safety experts and considered expressive for this task. By using these terminologies, we expect to increase the sensitivity of the ADR-PRISM Skill Cartridge for pharmacovigilance. Our choice to map <italic>Racine Pharma</italic> to ATC was guided by 2 aspects. First, ATC like MedDRA has a hierarchical structure. Thus, we will be able to evaluate the ADR information extraction tool based on different hierarchical levels of these terminologies. Second, ATC and MedDRA are widely used and internationally agreed reference terminologies. Hence, we expect to provide strong and reproducible results.</p>
        <p>The ADR information extraction module was not only based on drug and AE information identification but also on rules and regular expressions. As such, we expect to discard noninformative sentences, addressing general information about the drug or drug indications. We would also be able to identify unexpected <italic>positive</italic> effects, as for example, headaches that would be reduced by a drug without indication for the treatment of this kind of pain. Only few studies have been able to take this aspect into account [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref46">46</xref>].</p>
      </sec>
      <sec>
        <title>Study Limitations</title>
        <p>Despite its positive aspects, the study exhibits several limitations.</p>
        <p>The mapping between the terms listed in the drug thesaurus <italic>Racine Pharma</italic> and the terms referenced in the chemical substance in the ATC hierarchy was incomplete. Among the 5164 terms in <italic>Racine Pharma</italic>, 852 (16.5%, 852/5164) could not be mapped to ATC, for example, some phytotherapies (St John’s wort herbal tea, Silver birch juice, extract of licorice root, arum triphyllum compound, arnica, etc). This could have a negative impact on the recall scores calculated according to the ATC levels.</p>
        <p>In social media’ posts, slangs and colloquial languages are frequent; likewise, syntactic rules are approximate. We chose to use fuzzy-matching and thesaurus enrichment to take into account this bias. However, this approach is inherently nonexhaustive with negative impact on the recall of the ADR information extraction module.</p>
        <p>Regarding the gold standard, 2 experts in medical terminologies trained in drug safety performed manual annotations. However, contrary to the phase 1 manual review, none of them could be considered as a pharmacovigilance expert.</p>
        <p>The medical informatics community needs shared open corpora to evaluate their methods and tools. Recent efforts have led to making several datasets more accessible and the evaluation of the methods more standardized, for example, the Multiparameter Intelligent Monitoring in Intensive Care corpus [<xref ref-type="bibr" rid="ref47">47</xref>] and the Informatics for Integrating Biology and the Bedside challenges [<xref ref-type="bibr" rid="ref48">48</xref>]. Drug safety could benefit from open-access validation datasets made available for research purposes [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. However, several obstacles remain. For example, the ADR-PRISM consortium got approval to reuse posts for research purposes, but the approval is restricted to the project.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>The objective of this study is to present the scientific approach developed in the first stage of the ADR-PRISM project. At this stage, our principal objective was to evaluate the performance of the ADR information extraction Skill Cartridge against a gold standard constituted by human annotations. To address this question, our goal was to adapt the principles adopted in clinical research to assess sound and trustworthy measurements of precision, recall, and f-measure.</p>
        <p>With the statistical theory, we calculated a sample size. This guaranteed enough ADR information and sufficient narrowness of the confidence interval, to scientifically conclude on our principal objective. We also avoided unnecessarily large extractions for which the process of manual annotations is nothing but both wasteful and time-consuming.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>Designs of articles related to ADR information extraction on social media (replicated from Sarker et al).</p>
        <media xlink:href="resprot_v8i5e11448_app1.pdf" xlink:title="PDF File (Adobe PDF File), 94KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ADR</term>
          <def>
            <p>adverse drug reaction</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ADR-PRISM</term>
          <def>
            <p>Adverse Drug Reaction from Patient Reports in Social Media</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">AE</term>
          <def>
            <p>adverse event</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">ATC</term>
          <def>
            <p>Anatomical Therapeutic Chemical (in ATC classification)</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">FAERS</term>
          <def>
            <p>Food and Drug Administration’ adverse event reporting system</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">FDA</term>
          <def>
            <p>Food and Drug Administration</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">HLGT</term>
          <def>
            <p>high-level group term</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">HLT</term>
          <def>
            <p>high-level term</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">MedDRA</term>
          <def>
            <p>Medical Dictionary for Regulatory Activities</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">PT</term>
          <def>
            <p>preferred term</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">SIBM-CISMeF</term>
          <def>
            <p>Biomedicine informatics service catalogue and index of French language medical websites (French Service d’Informatique Biomédicale-Catalogue et Index des Sites Médicaux de langue Française)</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">SOC</term>
          <def>
            <p>system organ class</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was labeled in 2013 by the competitiveness cluster Cap Digital and funded by the French General Direction for Enterprises (Direction Générale des Entreprises) and territorial collectivities (Ile de France and Haute Normandie) under the 16th French Unique Interministerial Fund request for proposal through the ADR-PRISM project.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bates</surname>
            <given-names>DW</given-names>
          </name>
          <name name-style="western">
            <surname>Evans</surname>
            <given-names>RS</given-names>
          </name>
          <name name-style="western">
            <surname>Murff</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Stetson</surname>
            <given-names>PD</given-names>
          </name>
          <name name-style="western">
            <surname>Pizziferri</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Hripcsak</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Detecting adverse events using information technology</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2003</year>  
        <volume>10</volume>  
        <issue>2</issue>  
        <fpage>115</fpage>  
        <lpage>28</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&amp;pmid=12595401"/>
        </comment>  
        <pub-id pub-id-type="medline">12595401</pub-id>
        <pub-id pub-id-type="pmcid">PMC150365</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Golomb</surname>
            <given-names>BA</given-names>
          </name>
          <name name-style="western">
            <surname>McGraw</surname>
            <given-names>JJ</given-names>
          </name>
          <name name-style="western">
            <surname>Evans</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Dimsdale</surname>
            <given-names>JE</given-names>
          </name>
        </person-group>
        <article-title>Physician response to patient reports of adverse drug effects: implications for patient-targeted adverse effect surveillance</article-title>
        <source>Drug Saf</source>  
        <year>2007</year>  
        <volume>30</volume>  
        <issue>8</issue>  
        <fpage>669</fpage>  
        <lpage>75</lpage>  
        <pub-id pub-id-type="doi">10.2165/00002018-200730080-00003</pub-id>
        <pub-id pub-id-type="medline">17696579</pub-id>
        <pub-id pub-id-type="pii">3083</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hazell</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Shakir</surname>
            <given-names>SA</given-names>
          </name>
        </person-group>
        <article-title>Under-reporting of adverse drug reactions : a systematic review</article-title>
        <source>Drug Saf</source>  
        <year>2006</year>  
        <volume>29</volume>  
        <issue>5</issue>  
        <fpage>385</fpage>  
        <lpage>96</lpage>  
        <pub-id pub-id-type="doi">10.2165/00002018-200629050-00003</pub-id>
        <pub-id pub-id-type="medline">16689555</pub-id>
        <pub-id pub-id-type="pii">2953</pub-id></nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sarker</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Ginn</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Nikfarjam</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>O'Connor</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Smith</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Jayaraman</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Upadhaya</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Gonzalez</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Utilizing social media data for pharmacovigilance: a review</article-title>
        <source>J Biomed Inform</source>  
        <year>2015</year>  
        <month>04</month>  
        <volume>54</volume>  
        <fpage>202</fpage>  
        <lpage>12</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://linkinghub.elsevier.com/retrieve/pii/S1532-0464(15)00036-2"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2015.02.004</pub-id>
        <pub-id pub-id-type="medline">25720841</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(15)00036-2</pub-id>
        <pub-id pub-id-type="pmcid">PMC4408239</pub-id></nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bate</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Lindquist</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Edwards</surname>
            <given-names>IR</given-names>
          </name>
          <name name-style="western">
            <surname>Olsson</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Orre</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Lansner</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>De Freitas</surname>
            <given-names>RM</given-names>
          </name>
        </person-group>
        <article-title>A Bayesian neural network method for adverse drug reaction signal generation</article-title>
        <source>Eur J Clin Pharmacol</source>  
        <year>1998</year>  
        <month>06</month>  
        <volume>54</volume>  
        <issue>4</issue>  
        <fpage>315</fpage>  
        <lpage>21</lpage>  
        <pub-id pub-id-type="medline">9696956</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>DuMouchel</surname>
            <given-names>W</given-names>
          </name>
        </person-group>
        <article-title>Bayesian data mining in large frequency tables, with an application to the FDA spontaneous reporting system</article-title>
        <source>The American Statistician</source>  
        <year>1999</year>  
        <month>08</month>  
        <volume>53</volume>  
        <issue>3</issue>  
        <fpage>177</fpage>  
        <pub-id pub-id-type="doi">10.2307/2686093</pub-id></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Szarfman</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Machado</surname>
            <given-names>SG</given-names>
          </name>
          <name name-style="western">
            <surname>O'Neill</surname>
            <given-names>RT</given-names>
          </name>
        </person-group>
        <article-title>Use of screening algorithms and computer systems to efficiently signal higher-than-expected combinations of drugs and events in the US FDA's spontaneous reports database</article-title>
        <source>Drug Saf</source>  
        <year>2002</year>  
        <volume>25</volume>  
        <issue>6</issue>  
        <fpage>381</fpage>  
        <lpage>92</lpage>  
        <pub-id pub-id-type="doi">10.2165/00002018-200225060-00001</pub-id>
        <pub-id pub-id-type="medline">12071774</pub-id>
        <pub-id pub-id-type="pii">250601</pub-id></nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>van Puijenbroek</surname>
            <given-names>EP</given-names>
          </name>
          <name name-style="western">
            <surname>Bate</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Leufkens</surname>
            <given-names>HG</given-names>
          </name>
          <name name-style="western">
            <surname>Lindquist</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Orre</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Egberts</surname>
            <given-names>AC</given-names>
          </name>
        </person-group>
        <article-title>A comparison of measures of disproportionality for signal detection in spontaneous reporting systems for adverse drug reactions</article-title>
        <source>Pharmacoepidemiol Drug Saf</source>  
        <year>2002</year>  
        <volume>11</volume>  
        <issue>1</issue>  
        <fpage>3</fpage>  
        <lpage>10</lpage>  
        <pub-id pub-id-type="doi">10.1002/pds.668</pub-id>
        <pub-id pub-id-type="medline">11998548</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Katsahian</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Simond</surname>
            <given-names>ME</given-names>
          </name>
          <name name-style="western">
            <surname>Leprovost</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Lardon</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Bousquet</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Kerdelhué</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Abdellaoui</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Texier</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Burgun</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Boussadi</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Faviez</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Evaluation of internet social networks using net scoring tool: a case study in adverse drug reaction mining</article-title>
        <source>Stud Health Technol Inform</source>  
        <year>2015</year>  
        <volume>210</volume>  
        <fpage>526</fpage>  
        <lpage>30</lpage>  
        <pub-id pub-id-type="doi">10.3233/978-1-61499-512-8-526</pub-id>
        <pub-id pub-id-type="medline">25991203</pub-id></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>ISDB</collab>
        </person-group>
        <source>International Society of Drug Bulletins</source>  
        <year>2005</year>  
        <month>01</month>  
        <access-date>2018-06-29</access-date>
        <publisher-name>ISDB EU</publisher-name>
        <comment>ISDB EU: Berlin Declaration on Pharmacovigilance 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.akdae.de/Arzneimittelsicherheit/Weitere/Archiv/2005/85_200501252.pdf">https://www.akdae.de/Arzneimittelsicherheit/Weitere/Archiv/2005/85_200501252.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="70UZb66y8"/></comment> </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ho</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Le</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Thai</surname>
            <given-names>DT</given-names>
          </name>
          <name name-style="western">
            <surname>Taewijit</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Data-driven approach to detect and predict adverse drug reactions</article-title>
        <source>Curr Pharm Des</source>  
        <year>2016</year>  
        <volume>22</volume>  
        <issue>23</issue>  
        <fpage>3498</fpage>  
        <lpage>526</lpage>  
        <pub-id pub-id-type="medline">27157416</pub-id>
        <pub-id pub-id-type="pii">CPD-EPUB-75526</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wong</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Plasek</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Montecalvo</surname>
            <given-names>SP</given-names>
          </name>
          <name name-style="western">
            <surname>Zhou</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Natural language processing and its implications for the future of medication safety: a narrative review of recent advances and challenges</article-title>
        <source>Pharmacotherapy</source>  
        <year>2018</year>  
        <month>06</month>  
        <day>09</day>  
        <volume>38</volume>  
        <issue>8</issue>  
        <fpage>822</fpage>  
        <lpage>41</lpage>  
        <pub-id pub-id-type="doi">10.1002/phar.2151</pub-id>
        <pub-id pub-id-type="medline">29884988</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Tricco</surname>
            <given-names>AC</given-names>
          </name>
          <name name-style="western">
            <surname>Zarin</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Lillie</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Pham</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Straus</surname>
            <given-names>SE</given-names>
          </name>
        </person-group>
        <article-title>Utility of social media and crowd-sourced data for pharmacovigilance: a scoping review protocol</article-title>
        <source>BMJ Open</source>  
        <year>2017</year>  
        <month>12</month>  
        <day>19</day>  
        <volume>7</volume>  
        <issue>1</issue>  
        <fpage>e013474</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://bmjopen.bmj.com/cgi/pmidlookup?view=long&amp;pmid=28104709"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/bmjopen-2016-013474</pub-id>
        <pub-id pub-id-type="medline">28104709</pub-id>
        <pub-id pub-id-type="pii">bmjopen-2016-013474</pub-id>
        <pub-id pub-id-type="pmcid">PMC5253521</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bossuyt</surname>
            <given-names>PM</given-names>
          </name>
          <name name-style="western">
            <surname>Reitsma</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Bruns</surname>
            <given-names>DE</given-names>
          </name>
          <name name-style="western">
            <surname>Gatsonis</surname>
            <given-names>CA</given-names>
          </name>
          <name name-style="western">
            <surname>Glasziou</surname>
            <given-names>PP</given-names>
          </name>
          <name name-style="western">
            <surname>Irwig</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Lijmer</surname>
            <given-names>JG</given-names>
          </name>
          <name name-style="western">
            <surname>Moher</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Rennie</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>de Vet</surname>
            <given-names>HC</given-names>
          </name>
          <name name-style="western">
            <surname>Kressel</surname>
            <given-names>HY</given-names>
          </name>
          <name name-style="western">
            <surname>Rifai</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Golub</surname>
            <given-names>RM</given-names>
          </name>
          <name name-style="western">
            <surname>Altman</surname>
            <given-names>DG</given-names>
          </name>
          <name name-style="western">
            <surname>Hooft</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Korevaar</surname>
            <given-names>DA</given-names>
          </name>
          <name name-style="western">
            <surname>Cohen</surname>
            <given-names>JF</given-names>
          </name>
          <collab>STARD Group</collab>
        </person-group>
        <article-title>STARD 2015: an updated list of essential items for reporting diagnostic accuracy studies</article-title>
        <source>BMJ</source>  
        <year>2015</year>  
        <month>10</month>  
        <day>28</day>  
        <volume>351</volume>  
        <fpage>h5527</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/cgi/pmidlookup?view=long&amp;pmid=26511519"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/bmj.h5527</pub-id>
        <pub-id pub-id-type="medline">26511519</pub-id>
        <pub-id pub-id-type="pmcid">PMC4623764</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bousquet</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Dahamna</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Guillemin-Lanne</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Darmoni</surname>
            <given-names>SJ</given-names>
          </name>
          <name name-style="western">
            <surname>Faviez</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Huot</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Katsahian</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Leroux</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Pereira</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Richard</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Schück</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Souvignet</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Lillo-Le</surname>
            <given-names>LA</given-names>
          </name>
          <name name-style="western">
            <surname>Texier</surname>
            <given-names>N</given-names>
          </name>
        </person-group>
        <article-title>The adverse drug reactions from patient reports in social media project: five major challenges to overcome to operationalize analysis and efficiently support pharmacovigilance process</article-title>
        <source>JMIR Res Protoc</source>  
        <year>2017</year>  
        <month>09</month>  
        <day>21</day>  
        <volume>6</volume>  
        <issue>9</issue>  
        <fpage>e179</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.researchprotocols.org/2017/9/e179/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/resprot.6463</pub-id>
        <pub-id pub-id-type="medline">28935617</pub-id>
        <pub-id pub-id-type="pii">v6i9e179</pub-id>
        <pub-id pub-id-type="pmcid">PMC5629348</pub-id></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Board</surname>
            <given-names>I</given-names>
          </name>
        </person-group>
        <source>Medical Dictionary for Regulatory Activities</source>  
        <access-date>2018-06-27</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.meddra.org/">https://www.meddra.org/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="70Ua4UBNo"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
        <source>Catalog and Index of Medical Sites French-language</source>  
        <access-date>2018-06-27</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.chu-rouen.fr/cismef/outils/outils-et-services/">http://www.chu-rouen.fr/cismef/outils/outils-et-services/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="70UYyaz1Q"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
        <source>World Health Organization</source>  
        <access-date>2018-06-27</access-date>
        <comment>ATC/DDD Index 2017 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.whocc.no/atc_ddd_index/">https://www.whocc.no/atc_ddd_index/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="70UXT3c84"/></comment> </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
        <source>Kappa Santé</source>  
        <access-date>2018-06-27</access-date>
        <comment>Pharmaco-epidemiology Interventions in public and numeric health 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.kappasante.com/">https://www.kappasante.com/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="70UZvaGf0"/></comment> </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kostadinov</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <source>GitHub</source>  
        <access-date>2018-06-27</access-date>
        <comment>TEMIS LUXID 7.0.1 SKILL CARTRIDGE DEVELOPMENT CYCLE 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://fabian-kostadinov.github.io/2015/10/04/temis-luxid701-skill-cartridge-development-cycle/">http://fabian-kostadinov.github.io/2015/10/04/temis-luxid701-skill-cartridge-development-cycle/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="70UXfPs4L"/></comment> </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Deldossi</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Aboukhamis</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Faviez</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Dahamna</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Karapetiantz</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Guenegou-Arnoux</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Girardeau</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Guillemin-Lanne</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Lillo-Le-Louët</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Texier</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Burgun</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Katsahian</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Mining adverse drug reactions in social media with named entity recognition and semantic methods</article-title>
        <source>Stud Health Technol Inform</source>  
        <year>2017</year>  
        <volume>245</volume>  
        <fpage>322</fpage>  
        <lpage>6</lpage>  
        <pub-id pub-id-type="medline">29295108</pub-id></nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Cavalié</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Djeraba</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <source>ANSM [National Agency for the Safety of Medicines and Health Products]</source>  
        <year>2014</year>  
        <access-date>2018-06-27</access-date>
        <comment>[Analysis of drug sales in France in 2013] 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://ansm.sante.fr/var/ansm_site/storage/original/application/3df7b99f8f4c9ee634a6a9b094624341.pdf">https://ansm.sante.fr/var/ansm_site/storage/original/application/3df7b99f8f4c9ee634a6a9b094624341.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="70UXyC8tD"/></comment> </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kiritchenko</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Matwin</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Nock</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Famili</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Learning Evaluation in the Presence of Class Hierarchies: Application to Text Categorization</article-title>
        <year>2006</year>  
        <conf-name>19th Conference of the Canadian Society for Computational Studies of Intelligence</conf-name>
        <conf-date>June 7-9, 2006</conf-date>
        <conf-loc>Québec City, Québec, Canada</conf-loc>
        <publisher-loc>Berlin, Heidelberg</publisher-loc>
        <publisher-name>Springer</publisher-name>
        <fpage>395</fpage>  
        <lpage>406</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.svkir.com/papers/Kiritchenko-et-al-hierarchical-AI-2006.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>R Core Team</collab>
        </person-group>
        <source>R: A language and environment for statistical computing</source>  
        <year>2016</year>  
        <publisher-loc>Vienna, Austria</publisher-loc>
        <publisher-name>R Foundation for Statistical Computing</publisher-name>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.r-project.org/">https://www.r-project.org/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="77aU4dSIp"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ginn</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Pimpalkhute</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Nikfarjam</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Patki</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>O'Connor</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Sarker</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Smith</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Gonzalez</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <source>Arizona State University</source>  
        <year>2014</year>  
        <access-date>2019-04-01</access-date>
        <comment>Mining Twitter for adverse drug reaction mentions: a corpus and classification benchmark 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.nactem.ac.uk/biotxtm2014/papers/Ginnetal.pdf">http://www.nactem.ac.uk/biotxtm2014/papers/Ginnetal.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="77K671ICh"/></comment> </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hadzi-Puric</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Grmusa</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Automatic Drug Adverse Reaction Discovery from Parenting Websites Using Disproportionality Methods</article-title>
        <year>2012</year>  
        <conf-name>IEEE/ACM International Conference on Advances in Social Networks Analysis and Mining</conf-name>
        <conf-date>August 26-29, 2012</conf-date>
        <conf-loc>Istanbul, Turkey</conf-loc>
        <fpage>792</fpage>  
        <lpage>797</lpage>  
        <pub-id pub-id-type="doi">10.1109/ASONAM.2012.144</pub-id></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Leaman</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Wojtulewicz</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Sullivan</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Skariah</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Gonzalez</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Towards internet-age pharmacovigilance: extracting adverse drug reactions from user posts to health-related social networks</article-title>
        <year>2010</year>  
        <conf-name>Workshop on Biomedical Natural Language Processing (BioNLP 2010) ACL 2010</conf-name>
        <conf-date>July 15, 2010</conf-date>
        <conf-loc>Uppsala, Sweden</conf-loc>
        <fpage>117</fpage>  
        <lpage>125</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aclweb.org/anthology/W10-1915"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>AZDrugMiner: an information extraction system for mining patient-reported adverse drug events in online patient forums</article-title>
        <year>2013</year>  
        <conf-name>International Conference on Smart Health</conf-name>
        <conf-date>August 3-4, 2013</conf-date>
        <conf-loc>Beijing, China</conf-loc>
        <fpage>134</fpage>  
        <lpage>50</lpage>  
        <pub-id pub-id-type="doi">10.1007/978-3-642-39844-5_16</pub-id></nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Nikfarjam</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Gonzalez</surname>
            <given-names>GH</given-names>
          </name>
        </person-group>
        <article-title>Pattern mining for extraction of mentions of adverse drug reactions from user comments</article-title>
        <source>AMIA Annu Symp Proc</source>  
        <year>2011</year>  
        <volume>2011</volume>  
        <fpage>1019</fpage>  
        <lpage>26</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22195162"/>
        </comment>  
        <pub-id pub-id-type="medline">22195162</pub-id>
        <pub-id pub-id-type="pmcid">PMC3243273</pub-id></nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Nikfarjam</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Sarker</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>O'Connor</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Ginn</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Gonzalez</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Pharmacovigilance from social media: mining adverse drug reaction mentions using sequence labeling with word embedding cluster features</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2015</year>  
        <month>05</month>  
        <volume>22</volume>  
        <issue>3</issue>  
        <fpage>671</fpage>  
        <lpage>81</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&amp;pmid=25755127"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1093/jamia/ocu041</pub-id>
        <pub-id pub-id-type="medline">25755127</pub-id>
        <pub-id pub-id-type="pii">ocu041</pub-id>
        <pub-id pub-id-type="pmcid">PMC4457113</pub-id></nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>O'Connor</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Pimpalkhute</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Nikfarjam</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Ginn</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Smith</surname>
            <given-names>KL</given-names>
          </name>
          <name name-style="western">
            <surname>Gonzalez</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Pharmacovigilance on Twitter? Mining tweets for adverse drug reactions</article-title>
        <source>AMIA Annu Symp Proc</source>  
        <year>2014</year>  
        <volume>2014</volume>  
        <fpage>924</fpage>  
        <lpage>33</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25954400"/>
        </comment>  
        <pub-id pub-id-type="medline">25954400</pub-id>
        <pub-id pub-id-type="pmcid">PMC4419871</pub-id></nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Patki</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Sarker</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Pimpalkhute</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Nikfarjam</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Ginn</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Oconnor</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Smith</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Gonzalez</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <source>Arizona State University</source>  
        <year>2014</year>  
        <access-date>2019-04-01</access-date>
        <comment>Mining Adverse Drug Reaction Signals from Social Media: Going Beyond Extraction 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://diego.asu.edu/drugstats/Publication_repository/2014/patki_biolinksig/mining%20adverse%20drug%20reaction%20signals%20from%20social%20media-going%20beyond%20extraction.pdf">https://tinyurl.com/y4xwmjco</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="77K6WFaat"/></comment> </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sampathkumar</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Luo</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <article-title>Mining adverse drug reactions from online healthcare forums using hidden Markov model</article-title>
        <source>BMC Med Inform Decis Mak</source>  
        <year>2014</year>  
        <volume>14</volume>  
        <fpage>91</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.biomedcentral.com/1472-6947/14/91"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1472-6947-14-91</pub-id>
        <pub-id pub-id-type="medline">25341686</pub-id>
        <pub-id pub-id-type="pii">1472-6947-14-91</pub-id>
        <pub-id pub-id-type="pmcid">PMC4283122</pub-id></nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sarker</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Gonzalez</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Portable automatic text classification for adverse drug reaction detection via multi-corpus training</article-title>
        <source>J Biomed Inform</source>  
        <year>2015</year>  
        <month>02</month>  
        <volume>53</volume>  
        <fpage>196</fpage>  
        <lpage>207</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://linkinghub.elsevier.com/retrieve/pii/S1532-0464(14)00231-7"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2014.11.002</pub-id>
        <pub-id pub-id-type="medline">25451103</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(14)00231-7</pub-id>
        <pub-id pub-id-type="pmcid">PMC4355323</pub-id></nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Segura-Bedmar</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Revert</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Martínez</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>Detecting drugs and adverse events from Spanish social media streams</article-title>
        <source>Proceedings of the 5th International Workshop on Health Text Mining and Information Analysis (Louhi)</source>  
        <year>2014</year>  
        <conf-name>5th International Workshop on Health Text Mining and Information Analysis (Louhi)</conf-name>
        <conf-date>April 26-30, 2014</conf-date>
        <conf-loc>Gothenburg, Sweden</conf-loc>
        <fpage>106</fpage>  
        <lpage>15</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aclweb.org/anthology/W14-1117"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Kiang</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Identification of Consumer Adverse Drug Reaction Messages on Social Media</article-title>
        <source>PACIS 2013 Proceedings</source>  
        <year>2013</year>  
        <conf-name>The Pacific Asia Conference on Information Systems</conf-name>
        <conf-date>June 18-22, 2013</conf-date>
        <conf-loc>Jeju Island, Korea</conf-loc>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://aisel.aisnet.org/pacis2013/193"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yates</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Goharian</surname>
            <given-names>N</given-names>
          </name>
        </person-group>
        <article-title>ADRTrace: detecting expected and unexpected adverse drug reactions from user reviews on social media sites</article-title>
        <year>2013</year>  
        <conf-name>European Conference on Information Retrieval</conf-name>
        <conf-date>March 24-27, 2013</conf-date>
        <conf-loc>Moscow, Russia</conf-loc>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://link.springer.com/chapter/10.1007/978-3-642-36973-5_92"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1007/978-3-642-36973-5_92</pub-id></nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Benton</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Ungar</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Hill</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Hennessy</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Mao</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Chung</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Leonard</surname>
            <given-names>CE</given-names>
          </name>
          <name name-style="western">
            <surname>Holmes</surname>
            <given-names>JH</given-names>
          </name>
        </person-group>
        <article-title>Identifying potential adverse effects using the web: a new approach to medical hypothesis generation</article-title>
        <source>J Biomed Inform</source>  
        <year>2011</year>  
        <month>12</month>  
        <volume>44</volume>  
        <issue>6</issue>  
        <fpage>989</fpage>  
        <lpage>96</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://linkinghub.elsevier.com/retrieve/pii/S1532-0464(11)00123-7"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2011.07.005</pub-id>
        <pub-id pub-id-type="medline">21820083</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(11)00123-7</pub-id>
        <pub-id pub-id-type="pmcid">PMC4404640</pub-id></nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bian</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Topaloglu</surname>
            <given-names>U</given-names>
          </name>
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <article-title>Towards large-scale Twitter mining for drug-related adverse events</article-title>
        <source>SHB12 (2012)</source>  
        <year>2012</year>  
        <month>10</month>  
        <day>29</day>  
        <volume>2012</volume>  
        <fpage>25</fpage>  
        <lpage>32</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28967001"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1145/2389707.2389713</pub-id>
        <pub-id pub-id-type="medline">28967001</pub-id>
        <pub-id pub-id-type="pmcid">PMC5619871</pub-id></nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chee</surname>
            <given-names>BW</given-names>
          </name>
          <name name-style="western">
            <surname>Berlin</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Schatz</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <article-title>Predicting adverse drug events from personal health messages</article-title>
        <source>AMIA Annu Symp Proc</source>  
        <year>2011</year>  
        <volume>2011</volume>  
        <fpage>217</fpage>  
        <lpage>26</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22195073"/>
        </comment>  
        <pub-id pub-id-type="medline">22195073</pub-id>
        <pub-id pub-id-type="pmcid">PMC3243174</pub-id></nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Freifeld</surname>
            <given-names>CC</given-names>
          </name>
          <name name-style="western">
            <surname>Brownstein</surname>
            <given-names>JS</given-names>
          </name>
          <name name-style="western">
            <surname>Menone</surname>
            <given-names>CM</given-names>
          </name>
          <name name-style="western">
            <surname>Bao</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Filice</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Kass-Hout</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Dasgupta</surname>
            <given-names>N</given-names>
          </name>
        </person-group>
        <article-title>Digital drug safety surveillance: monitoring pharmaceutical products in Twitter</article-title>
        <source>Drug Saf</source>  
        <year>2014</year>  
        <month>05</month>  
        <volume>37</volume>  
        <issue>5</issue>  
        <fpage>343</fpage>  
        <lpage>50</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24777653"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1007/s40264-014-0155-x</pub-id>
        <pub-id pub-id-type="medline">24777653</pub-id>
        <pub-id pub-id-type="pmcid">PMC4013443</pub-id></nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Jiang</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Zheng</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <article-title>Mining Twitter Data for Potential Drug Effects</article-title>
        <year>2013</year>  
        <conf-name>The 9th International Conference on Advanced Data Mining and Applications (ADMA )</conf-name>
        <conf-date>2013</conf-date>
        <conf-loc>Hangzhou, China</conf-loc>
        <pub-id pub-id-type="doi">10.1007/978-3-642-53914-5_37</pub-id></nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>CC</given-names>
          </name>
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Jiang</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Postmarketing drug safety surveillance using publicly available health-consumer-contributed content in social media</article-title>
        <source>ACM Trans Manage Inf Syst</source>  
        <year>2014</year>  
        <month>04</month>  
        <day>01</day>  
        <volume>5</volume>  
        <issue>1</issue>  
        <fpage>1</fpage>  
        <lpage>21</lpage>  
        <pub-id pub-id-type="doi">10.1145/2576233</pub-id></nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Jiang</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Social media mining for drug safety signal detection</article-title>
        <year>2012</year>  
        <conf-name>Proceedings of the international workshop on Smart healthwellbeing</conf-name>
        <conf-date>Octiber 29, 2012</conf-date>
        <conf-loc>Maui, Hawaii, USA</conf-loc>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pages.drexel.edu/~hy95/publications/2012SHB.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yeleswarapu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Rao</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Joseph</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Saipradeep</surname>
            <given-names>VG</given-names>
          </name>
          <name name-style="western">
            <surname>Srinivasan</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>A pipeline to extract drug-adverse event pairs from multiple data sources</article-title>
        <source>BMC Med Inform Decis Mak</source>  
        <year>2014</year>  
        <volume>14</volume>  
        <fpage>13</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.biomedcentral.com/1472-6947/14/13"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1472-6947-14-13</pub-id>
        <pub-id pub-id-type="medline">24559132</pub-id>
        <pub-id pub-id-type="pii">1472-6947-14-13</pub-id>
        <pub-id pub-id-type="pmcid">PMC3936866</pub-id></nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bollegala</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Maskell</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Sloane</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Hajne</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Pirmohamed</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Causality patterns for detecting adverse drug reactions from social media: text mining approach</article-title>
        <source>JMIR Public Health Surveill</source>  
        <year>2018</year>  
        <month>05</month>  
        <day>09</day>  
        <volume>4</volume>  
        <issue>2</issue>  
        <fpage>e51</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://publichealth.jmir.org/2018/2/e51/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/publichealth.8214</pub-id>
        <pub-id pub-id-type="medline">29743155</pub-id>
        <pub-id pub-id-type="pii">v4i2e51</pub-id>
        <pub-id pub-id-type="pmcid">PMC5966656</pub-id></nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Saeed</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Villarroel</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Reisner</surname>
            <given-names>AT</given-names>
          </name>
          <name name-style="western">
            <surname>Clifford</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Lehman</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Moody</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Heldt</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Kyaw</surname>
            <given-names>TH</given-names>
          </name>
          <name name-style="western">
            <surname>Moody</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Mark</surname>
            <given-names>RG</given-names>
          </name>
        </person-group>
        <article-title>Multiparameter intelligent monitoring in intensive care II: a public-access intensive care unit database</article-title>
        <source>Crit Care Med</source>  
        <year>2011</year>  
        <month>05</month>  
        <volume>39</volume>  
        <issue>5</issue>  
        <fpage>952</fpage>  
        <lpage>60</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21283005"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1097/CCM.0b013e31820a92c6</pub-id>
        <pub-id pub-id-type="medline">21283005</pub-id>
        <pub-id pub-id-type="pmcid">PMC3124312</pub-id></nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhu</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Cherry</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Kiritchenko</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Martin</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>de Bruijn</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <article-title>Detecting concept relations in clinical text: insights from a state-of-the-art model</article-title>
        <source>J Biomed Inform</source>  
        <year>2013</year>  
        <month>04</month>  
        <volume>46</volume>  
        <issue>2</issue>  
        <fpage>275</fpage>  
        <lpage>85</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(12)00180-3"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2012.11.006</pub-id>
        <pub-id pub-id-type="medline">23380683</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(12)00180-3</pub-id></nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
