<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v21i2e11016</article-id>
      <article-id pub-id-type="pmid">30724742</article-id>
      <article-id pub-id-type="doi">10.2196/11016</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Detecting Potential Adverse Drug Reactions Using a Deep Neural Network Model</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Yang</surname>
            <given-names>Hsih-Te</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Li</surname>
            <given-names>Ying</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="author" id="contrib1">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Chi-Shiang</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-8707-279X</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib2">
          <name name-style="western">
            <surname>Lin</surname>
            <given-names>Pei-Ju</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-6166-1644</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib3">
          <name name-style="western">
            <surname>Cheng</surname>
            <given-names>Ching-Lan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-7201-8491</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib4">
          <name name-style="western">
            <surname>Tai</surname>
            <given-names>Shu-Hua</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3398-5582</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib5">
          <name name-style="western">
            <surname>Kao Yang</surname>
            <given-names>Yea-Huei</given-names>
          </name>
          <degrees>BSPharm</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-4623-5561</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib6" corresp="yes">
          <name name-style="western">
            <surname>Chiang</surname>
            <given-names>Jung-Hsien</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Computer Science and Information Engineering</institution>
            <institution>National Cheng Kung University</institution>
            <addr-line>1 University Road</addr-line>
            <addr-line>Tainan, 701</addr-line>
            <country>Taiwan</country>
            <phone>886 6 2757575 ext 62534</phone>
            <email>jchiang@mail.ncku.edu.tw</email>
          </address>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-4657-6705</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
      <label>1</label>
      <institution>Department of Computer Science and Information Engineering</institution>
      <institution>National Cheng Kung University</institution>  
      <addr-line>Tainan</addr-line>
      <country>Taiwan</country></aff>
      <aff id="aff2">
      <label>2</label>
      <institution>School of Pharmacy</institution>
      <institution>College of Medicine</institution>  
      <institution>National Cheng Kung University</institution>  
      <addr-line>Tainan</addr-line>
      <country>Taiwan</country></aff>
      <aff id="aff3">
      <label>3</label>
      <institution>Institute of Clinical Pharmacy and Pharmaceutical Sciences</institution>
      <institution>College of Medicine</institution>  
      <institution>National Cheng Kung University</institution>  
      <addr-line>Tainan</addr-line>
      <country>Taiwan</country></aff>
      <aff id="aff4">
      <label>4</label>
      <institution>Department of Pharmacy</institution>
      <institution>National Cheng Kung University Hospital</institution>  
      <institution>National Cheng Kung University</institution>  
      <addr-line>Tainan</addr-line>
      <country>Taiwan</country></aff>
      <aff id="aff5">
      <label>5</label>
      <institution>Institute of Medical Informatics</institution>
      <institution>National Cheng Kung University</institution>  
      <addr-line>Tainan</addr-line>
      <country>Taiwan</country></aff>
      <author-notes>
        <corresp>Corresponding Author: Jung-Hsien Chiang 
        <email>jchiang@mail.ncku.edu.tw</email></corresp>
      </author-notes>
      <pub-date pub-type="collection"><month>02</month><year>2019</year></pub-date>
      <pub-date pub-type="epub">
        <day>06</day>
        <month>02</month>
        <year>2019</year>
      </pub-date>
      <volume>21</volume>
      <issue>2</issue>
      <elocation-id>e11016</elocation-id>
      <!--history from ojs - api-xml-->
      <history>
        <date date-type="received">
          <day>10</day>
          <month>5</month>
          <year>2018</year>
        </date>
        <date date-type="rev-request">
          <day>2</day>
          <month>9</month>
          <year>2018</year>
        </date>
        <date date-type="rev-recd">
          <day>3</day>
          <month>10</month>
          <year>2018</year>
        </date>
        <date date-type="accepted">
          <day>4</day>
          <month>11</month>
          <year>2018</year>
        </date>
      </history>
      <copyright-statement>©Chi-Shiang Wang, Pei-Ju Lin, Ching-Lan Cheng, Shu-Hua Tai, Yea-Huei Kao Yang, Jung-Hsien Chiang. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 06.02.2019.</copyright-statement>
      <copyright-year>2019</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://www.jmir.org/2019/2/e11016/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Adverse drug reactions (ADRs) are common and are the underlying cause of over a million serious injuries and deaths each year. The most familiar method to detect ADRs is relying on spontaneous reports. Unfortunately, the low reporting rate of spontaneous reports is a serious limitation of pharmacovigilance.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The objective of this study was to identify a method to detect potential ADRs of drugs automatically using a deep neural network (DNN).</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We designed a DNN model that utilizes the chemical, biological, and biomedical information of drugs to detect ADRs. This model aimed to fulfill two main purposes: identifying the potential ADRs of drugs and predicting the possible ADRs of a new drug. For improving the detection performance, we distributed representations of the target drugs in a vector space to capture the drug relationships using the word-embedding approach to process substantial biomedical literature. Moreover, we built a mapping function to address new drugs that do not appear in the dataset.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Using the drug information and the ADRs reported up to 2009, we predicted the ADRs of drugs recorded up to 2012. There were 746 drugs and 232 new drugs, which were only recorded in 2012 with 1325 ADRs. The experimental results showed that the overall performance of our model with mean average precision at top-10 achieved is 0.523 and the rea under the receiver operating characteristic curve (AUC) score achieved is 0.844 for ADR prediction on the dataset.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our model is effective in identifying the potential ADRs of a drug and the possible ADRs of a new drug. Most importantly, it can detect potential ADRs irrespective of whether they have been reported in the past.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>adverse drug reactions</kwd>
        <kwd>deep neural network</kwd>
        <kwd>drug representation</kwd>
        <kwd>machine learning</kwd>
        <kwd>pharmacovigilance</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>An adverse drug reaction (ADR) [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>] is a serious problem that refers to side effects that occur despite the administration of a regular dose of a drug. It is estimated that over 2 million serious ADRs occur among hospitalized patients, which causes &gt;100,000 deaths each year [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Unfortunately, it is difficult to identify or predict potential ADRs owing to insufficient data.</p>
      <p>Spontaneous reporting in pre- and postmarket stages are the most familiar methods to identify ADRs early on. Specifically, safety reports from clinical trials are used to list common ADRs in the premarket stage [<xref ref-type="bibr" rid="ref5">5</xref>], while data collected and analyzed from various databases and marketing surveys, such as pharmacovigilance and risk management, are used in the postmarket stage. Although most new ADRs are identified from spontaneous reports, &gt;90% go unreported [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]; this is recognized to be a major limitation. Pharmaceutical companies are trying to avoid side effects in the development stage of drugs. However, although they can identify and address common side effects, it is generally not feasible to identify or predict rare and serious side effects. To overcome these limitations, several studies have utilized a substantial amount of data and various information sources to predict ADRs using statistical methods [<xref ref-type="bibr" rid="ref8">8</xref>] and machine learning approaches [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
      <p>The fundamental method for identifying ADRs pertains to identifying the relationship between drugs and their side effects from diverse sources of information [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref12">12</xref>] such as clinical trials, electronic medical records (EMRs), social media, and biomedical literature. For instance, PubMed contains valuable information that could aid ADR detection. Karimi et al [<xref ref-type="bibr" rid="ref13">13</xref>] reviewed data mining and techniques related to computer science, which have been studied in the area of drug safety to identify reports of ADR from different sources. Tatonetti et al [<xref ref-type="bibr" rid="ref14">14</xref>] proposed a novel algorithm for building a predictive model that can detect hidden interactions in adverse event reports to infer unreported adverse events. Wang et al [<xref ref-type="bibr" rid="ref15">15</xref>] developed a model for identifying ADRs using data mining to extract information from millions of EMRs. It used clinical notes with information on specific drugs and known adverse drug events (ADEs) that have been preprocessed using statistical methods to compute the probability that a given drug-disorder pair represents a valid ADE association. This method automatically determines whether a specific adverse event is caused by a specific drug based on the content of PubMed citations [<xref ref-type="bibr" rid="ref16">16</xref>]. Finkelstein et al [<xref ref-type="bibr" rid="ref17">17</xref>] developed a tool to automatically detect and summarize information on ADRs from journal papers. It then ranked the ADRs of a drug on a user-friendly interface for physicians.</p>
      <p>Several studies have utilized either chemical or molecular pathways of drugs to predict ADRs [<xref ref-type="bibr" rid="ref18">18</xref>]. Cami et al [<xref ref-type="bibr" rid="ref19">19</xref>] developed a novel approach to predict ADEs by using information on specific drugs and the adverse event to predict likely unknown ADEs. Lorberbaum et al [<xref ref-type="bibr" rid="ref20">20</xref>] hypothesized that systems biology and chemical genomics data can improve drug safety surveillance by highlighting drugs with a mechanistic connection to the target phenotype and by filtering those which do not. They presented an algorithm, the modular assembly of drug safety subnetworks, to combine systems pharmacology and pharmacovigilance data. The algorithm markedly improved drug safety monitoring for 4 clinically relevant ADRs. Huang et al [<xref ref-type="bibr" rid="ref21">21</xref>] proposed a framework for predicting ADR profiles by integrating protein-protein interaction networks with drug structures. Some researchers utilized the chemical, biological, and phenotypic characteristics of drugs to predict the ADRs. Liu et al [<xref ref-type="bibr" rid="ref22">22</xref>] proposed a machine learning approach for predicting the ADRs by integrating the phenotypic characteristics, which included chemical structure, biological properties, and protein target and pathway information.</p>
      <p>However, most of those approaches rely on heavily handcrafted features and treat ADR identification as a classification problem, which does not take the order of the ADRs discovered into consideration. Therefore, the process tends to be more expensive and leads to the loss of significant information on drug-ADR relationships in the model training phase. Furthermore, these approaches are unable to predict the ADR of new drugs, thus rendering the detection of ADR more difficult [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
      <p>To address these limitations, we used a deep neural network (DNN) model for the detection of ADRs of drugs. The model has 2 purposes: the identification of ADRs, which entailed the discovery of potential ADRs of a drug from known ADR records, and the prediction of ADRs, which pertained to predicting the possible ADRs for a new drug. We used the word-embedding approach and mapping function to process new drugs that did not appear in the dataset. Furthermore, we examined the overall performance of the model with various feature combinations and the number of hidden layers in the DNN architecture.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Description</title>
        <p>To develop and evaluate a DNN model, we used data from Side Effect Resource (SIDER) [<xref ref-type="bibr" rid="ref23">23</xref>], a database of drugs with side effects, which contains information on medicines in the market since 2009 and their recorded ADRs [<xref ref-type="bibr" rid="ref24">24</xref>]. We collected the ADR information from 2009 and 2012 from SIDER to represent the simulated prospective approach. In total, 746 drugs and 1325 side effect terms related to these drugs were recorded in both years. Additional 232 drugs appeared only in the 2012 dataset as new drugs. It is important to monitor the ADRs of drugs throughout their life cycle, from the preclinical research phase to postmarket surveillance. The fundamental properties of drugs rely on preclinical <italic>in vitro</italic> safety profiling that involves the testing of compounds with chemical and biological properties. Therefore, we extracted these properties as a part of the features in the model. We extracted the 17 molecular descriptors of drugs from PubChem [<xref ref-type="bibr" rid="ref25">25</xref>] (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>). We utilized the biological features from DrugBank [<xref ref-type="bibr" rid="ref26">26</xref>] to represent the biomolecular interactions and pathways. These features contain the targets, enzymes, transporters, and carriers of each drug and their actions.</p>
        <p>For enriching the scientific evidence and enhancing the detection of ADRs, we collected millions of papers from the Medical Literature Analysis and Retrieval System Online (MEDLINE) [<xref ref-type="bibr" rid="ref27">27</xref>] to be used as auxiliary data to enrich the information about each drug. We used the name of each drug as the query term and selected all the papers related to the drug, published before 2009, such as case reports, clinical trials, and observational studies. The reason for collecting the papers published before 2009 is that we wanted to simulate the progress of drug surveillance from 2009 to 2012.</p>
        <boxed-text id="box1" position="float">
          <title>The 17 molecular descriptors for the chemical features identified in this study.</title>
          <list list-type="order">
            <list-item>
              <p>Molecular Weight</p>
            </list-item>
            <list-item>
              <p>XLogP3</p>
            </list-item>
            <list-item>
              <p>Hydrogen Bond Donor Count</p>
            </list-item>
            <list-item>
              <p>Hydrogen Bond Acceptor Count</p>
            </list-item>
            <list-item>
              <p>Rotatable Bond Count</p>
            </list-item>
            <list-item>
              <p>Exact Mass</p>
            </list-item>
            <list-item>
              <p>Monoisotopic Mass</p>
            </list-item>
            <list-item>
              <p>Topological Polar Surface Area</p>
            </list-item>
            <list-item>
              <p>Heavy Atom Count</p>
            </list-item>
            <list-item>
              <p>Formal Charge</p>
            </list-item>
            <list-item>
              <p>Complexity</p>
            </list-item>
            <list-item>
              <p>Isotope Atom Count</p>
            </list-item>
            <list-item>
              <p>Defined Atom Stereocenter Count</p>
            </list-item>
            <list-item>
              <p>Undefined Atom Stereocenter Count</p>
            </list-item>
            <list-item>
              <p>Defined Bond Stereocenter Count</p>
            </list-item>
            <list-item>
              <p>Undefined Bond Stereocenter Count</p>
            </list-item>
            <list-item>
              <p>Covalently- Bonded Unit Count</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
      <sec>
        <title>Features of Drug Description</title>
        <p>We treated ADR identification as an information retrieval problem, such that our model could discover the potential relationships between each drug and the 1325 side effects recorded. We represented the prediction target of 1325 dimensions with a binary profile of elements corresponding to the presence or absence of side effects with 1 or 0, <italic>Y</italic> ∈ ℕ<sup><italic>n</italic> </sup><sup>×1325</sup> with <italic>n</italic> being the number of drugs. Each drug was associated with 3 types of features: the chemical properties, biological properties, and information from the literature. In addition, the known ADR records of drugs were included. After preprocessing, we filtered out 2 empty properties: the Isotope Atom Count and the Undefined Bond Stereocenter Count. Subsequently, the feature of chemical properties was represented using a 15-dimensional vector, with <italic>X</italic><sub>Chem</sub> ∈ ℝ<sup><italic>n</italic> </sup><sup>×15</sup> for each element. The biological properties, extracted from DrugBank, contained 4 phases of information including the carriers, enzymes (for drug metabolism), protein targets, and transporters (for drug transportation). After preprocessing, we utilized the biological information to represent each drug with the 1048-dimensional vector, which included 788 protein targets, 162 enzymes, 85 transporters, and 13 carriers, with <italic>X</italic><sub>Bio</sub> ∈ ℕ<sup><italic>n</italic> </sup><sup>×1048</sup> for different action types in each element. The known ADR records of a drug played an important role in identifying potential ADRs. Thus, we leveraged this information to predict potential ADRs that appeared in 2012.</p>
        <p>The biomedical literature played an important role in this study because it contains a large amount of information related to drugs and ADRs such as clinical notes and case reports. However, one of the issues in extracting the drug information from biomedical literature is the uncertainty regarding which words or documents represent the drug. Therefore, we trained the model to understand the semantic features of drugs from 2.3 million biomedical papers on 764 drugs introduced before 2009 by utilizing one of the most popular embedding methods Word2Vec [<xref ref-type="bibr" rid="ref28">28</xref>-<xref ref-type="bibr" rid="ref30">30</xref>] to model it using the skip-gram model. Subsequently, we used the vector of the drug name as the drug vector (drug2vec, D2V), <italic>X</italic><sub>D2V</sub> ∈ ℝ<sup><italic>n</italic> </sup><sup>×400</sup>, with <italic>n</italic> being the number of drugs. We observed that the features represented by D2V were more comprehensive than the intrinsic features in the experiments. However, as we used drug names as the query term, we could not identify papers related to 232 new drugs. To address drugs that were not observed during the embedding training step, we expanded the D2V by introducing a drug description mapping function. Using <italic>V</italic><sub>D2V</sub> to denote the word-embedding space of the drug vector existing in the training and <italic>V</italic><sub>DDV</sub> to denote the new drug description vector the summation of each word vector related to the new drug in the papers, the mapping function <italic>f</italic> (<italic>v</italic>): <italic>V</italic><sub>DDV</sub>→ <italic>V</italic><sub>D2V</sub> was developed and parameterized by a <italic>W</italic>, such that <italic>v′=Wv</italic> for <italic>v</italic> ∈ <italic>V</italic><sub>DDV</sub> and <italic>v′</italic> ∈ <italic>V</italic><sub>D2V</sub> [<xref ref-type="bibr" rid="ref31">31</xref>] using the least absolute shrinkage and selection operator regression for training the <italic>W</italic> [<xref ref-type="bibr" rid="ref32">32</xref>]. This expansion method enabled the model to process new drugs, making it more flexible.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>The architecture of the deep neural network model for predicting and identifying the possible adverse drug reactions (ADRs) of a drug. After predicting, we generated a list of possible ADRs of a drug by ranking the probability of ADRs from the output in the model.</p>
          </caption>
          <graphic xlink:href="jmir_v21i2e11016_fig1.PNG" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Feature representation of adverse drug reaction (ADR) identification and prediction.</p>
          </caption>
          <graphic xlink:href="jmir_v21i2e11016_fig2.PNG" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
      <title>Adverse Drug Reaction Detection Deep Neural Network Model Description</title>
      <p>We designed a DNN model that can identify and predict the ADRs of a drug with different requirements. This model (<xref ref-type="fig" rid="figure1">Figure 1</xref>) was based on one of the common DNN architectures, multilayer perceptron [<xref ref-type="bibr" rid="ref33">33</xref>], which has been successfully applied in several prior studies. We added the dropout layer between each dense layer to avoid model overfitting in the training step [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. The process of the nonlinear transformation in each layer ensured that the model could learn more information from the input data. The model aimed at identifying and predicting potential ADRs of a drug. The identification function is fulfilled by seeking the potential ADRs of drugs by using known records of ADRs and various features of drugs. The prediction function pertains to the detection of potential ADRs of new drugs. We designed 2 kinds of feature representations (<xref ref-type="fig" rid="figure2">Figure 2</xref>) to distinguish the tasks of identification and prediction. In prediction, we assumed that the ADR record for a new drug was empty. Therefore, the feature of known ADR records with zero indicated that the possible ADRs of new drugs relied only on the semantic feature (drug2vec), chemical properties, and biological properties.</p>  
      <p>We treated the identification task as an information retrieval problem because drugs may have more than one ADR. Therefore, we designed the last layer with 1325 hidden nodes, which was equal to the number of ADRs in the dataset. Evaluating the probability of ADR <italic>y</italic> of a given drug <italic>x</italic>, we defined the <italic>p</italic> (<italic>y</italic> ∣ <italic>x</italic>) = σ(<italic>Wh</italic> + <italic>b</italic>), σ as the sigmoid function, to transfer the hidden vector <italic>h</italic> to the value between 0 and 1. We learned the <italic>p</italic> (<italic>y</italic> ∣ <italic>x</italic>) by minimizing the cross-entropy with <italic>D</italic>. When θ denoted all parameters of the model, the objective function ℒ(<italic>D</italic>, θ) was formulated as follows:</p>
      
      
      <disp-formula>ℒ(<italic>D</italic>, θ) = −<italic>Summation</italic> (<italic>y<sub>i</sub> log</italic> [<italic>p</italic> (<italic>y|x</italic>)] + [<italic>1−y<sub>i</sub></italic>] <italic>log</italic> [<italic>1−p</italic> (<italic>y|x</italic>]) / N</disp-formula>
      
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>In this study, we present a detailed analysis of the performance of our DNN model. Let <italic>Q</italic> denote the number of drugs in the dataset. We evaluated the model using the area under the receiver operating characteristic curve, shown in <xref ref-type="table" rid="table1">Table 1</xref>, and the mean average precision (MAP) <italic>AvePrecision</italic> (<italic>q</italic>)/<italic>Q</italic>, which has been widely used in multilabel problem and information retrieval evaluation. First, we assessed the abilities of different feature combinations to detect the ADRs of drugs. We examined the performance of our model with reference to the features presented in <xref ref-type="fig" rid="figure3">Figure 3</xref> (image on the left). The drug features included the biological, chemical, and D2V features. The chemical feature was found to perform poorly because of the duplicate and indistinguishable chemical properties extracted.</p>
      <p>Moreover, we removed the D2V and kept the other features to train the model. The results showed that the D2V was most informative, possibly because the D2V learned the valuable information from millions of papers. We then focused on method comparison with several common methods. We compared the abilities of 3 machine learning methods, namely, probability matrix factorization (PMF), Linear Support Vector Classifier, and Gaussian Naïve Bayes [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>], to predict and identify the ADRs of drugs. <xref ref-type="fig" rid="figure3">Figure 3</xref> (image on the right) shows the performance of different models based on 5-fold cross-validation using all biological, chemical, and D2V properties as features, except PMF. The PMF exhibited the worst performance because it considered the relationship between drugs and ADRs only based on latent information. One of the reasons why our model outperforms others is that the features of a drug enrich the information via the nonlinear transformation in deep learning.</p>
      <p>Subsequently, we investigated whether our model could process the specific tasks of prediction and identification. The performance on the prediction task (<xref ref-type="fig" rid="figure4">Figure 4</xref>, image on the left) exceeded that on the identification task. The identification task is more difficult than prediction because the former entails the detection of potentially rare ADRs. Although the identification function of this model could be improved, its overall performance revealed its capacity to address both tasks simultaneously.</p>
      <p>In addition, we plotted the performance of the model with a different number of hidden layers (<xref ref-type="fig" rid="figure4">Figure 4</xref>, image on the right). The performance of the model did not improve with an increase in the number of hidden layers. The model with 2 hidden layers was better than the others. Specifically, with the limited data size for 3 hidden layers, the model was unable to learn the good parameters from the data. Evidently, the number of hidden layers relies on data properties and the amount of data in the DNN.</p>
      <p>To evaluate our mapping function, we examined the drug expansion through the transfer of drug description to the D2V. The results, shown in <xref ref-type="table" rid="table2">Table 2</xref>, indicated that our mapping function could fit the performance of the D2V. The performance of the drug description through the mapping function was slightly better than that of D2V, possibly because some drugs did not exist in the space of D2V. This finding indicates that this model cannot predict the ADRs of such drugs without the mapping function. Accordingly, the mapping function was found to render the model more flexible to address new drugs.</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>The result showing the performance of model evaluated by area under the receiver operating characteristic curve (AUC).</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="900"/>
          <col width="100"/>
          <thead>
            <tr valign="top">
              <td>Model</td>
              <td>AUC</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Probability matrix factorization</td>
              <td>0.500</td>
            </tr>
            <tr valign="top">
              <td>Linear Support Vector Classifier</td>
              <td>0.523</td>
            </tr>
            <tr valign="top">
              <td>Gaussian Naïve Bayes</td>
              <td>0.597</td>
            </tr>
            <tr valign="top">
              <td>Deep neural network adverse drug reaction (DNN ADR) without hidden layer</td>
              <td>0.641</td>
            </tr>
            <tr valign="top">
              <td>DNN ADR with 1 hidden layer</td>
              <td>0.823</td>
            </tr>
            <tr valign="bottom">
              <td>DNN ADR with 2 hidden layers</td>
              <td><italic>0.844<sup>a</sup></italic></td>
            </tr>
            <tr valign="top">
              <td>DNN ADR with 3 hidden layers</td>
              <td>0.814</td>
            </tr>
            <tr valign="top">
              <td>DNN ADR without Bio features</td>
              <td>0.823</td>
            </tr>
            <tr valign="top">
              <td>DNN ADR without Chem features</td>
              <td>0.837</td>
            </tr>
            <tr valign="top">
              <td>DNN ADR without drug2vec features</td>
              <td>0.803</td>
            </tr>
            <tr valign="top">
              <td>DNN ADR</td>
              <td><italic>0.844</italic></td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table1fn1">
            <p><sup>a</sup>The italicized values indicate the best results in this comparison.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <fig id="figure3" position="float">
        <label>Figure 3</label>
        <caption>
          <p>Left: Effects of different feature combinations to detect the adverse drug reactions (ADRs) of drugs; right: A comparison of our deep neural network (DNN) model with various machine learning approaches. PMF: probability matrix factorization; LinearSVC: Linear Support Vector Classifier; GaussianNB: Gaussian Naïve Bayes.</p>
        </caption>
        <graphic xlink:href="jmir_v21i2e11016_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <fig id="figure4" position="float">
        <label>Figure 4</label>
        <caption>
          <p>Left: Performance of the deep neural network (DNN) model on the adverse drug reaction (ADR) identification and prediction tasks and the overall performance; right: In this experiment, we showed the performance of the model with several different layers. GaussianNB: Gaussian Naïve Bayes; LinearSVC: Linear Support Vector Classifier.</p>
        </caption>
        <graphic xlink:href="jmir_v21i2e11016_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>The results showing the ability of the mapping function to transfer the drug description to drug2vec with Mean Average Precision at Top N (MAP@N).</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="400"/>
          <col width="100"/>
          <col width="100"/>
          <col width="100"/>
          <col width="100"/>
          <col width="100"/>
          <col width="100"/>
          <thead>
            <tr valign="top">
              <td>MAP@N</td>
              <td>1</td>
              <td>3</td>
              <td>5</td>
              <td>10</td>
              <td>15</td>
              <td>20</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="bottom">
              <td>Mapping function</td>
              <td><italic>0.068<sup>a</sup></italic></td>
              <td><italic>0.179</italic></td>
              <td><italic>0.272</italic></td>
              <td><italic>0.462</italic></td>
              <td><italic>0.462</italic></td>
              <td><italic>0.462</italic></td>
            </tr>
            <tr valign="top">
              <td>drug2vec</td>
              <td>0.065</td>
              <td>0.174</td>
              <td>0.267</td>
              <td>0.453</td>
              <td>0.453</td>
              <td>0.453</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table2fn1">
            <p><sup>a</sup>The italicized values indicate the best results in this comparison.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
      <title>Principal Findings</title>
      <p>In this study, we aimed to increase the diversity of information on drugs to improve our ability to detect ADRs. Accordingly, we extracted information from the chemical and biological properties of drugs and from the existing biomedical literature. The MEDLINE was selected as the source for biomedical literature to identify important auxiliary data because it contains several types of biomedical papers, such as clinical trials, case reports, and observational studies, related to drugs. However, it was difficult to use keywords to identify specific drugs from millions of papers and words. Therefore, we utilized 2.3 million biomedical papers to identify the semantic features of drug using the skip-gram model in Word2Vec. In particular, for a central word <italic>w</italic><sub><italic>t</italic> </sub> under consideration, the probability <italic>p</italic> (<italic>w</italic><sub><italic>t</italic> </sub><sub>±</sub><sub><italic>i</italic> </sub>∣ <italic>w</italic><sub><italic>t</italic> </sub>) of predicting the surrounding word <italic>w</italic><sub><italic>t</italic> </sub><sub>±</sub><sub><italic>i</italic> </sub> depended on the <italic>w</italic><sub><italic>t</italic> </sub>. The subscript <italic>t</italic> indicates a target word, such as the drug name “Dantrolene,” and the <italic>i</italic> represented the windows size of the target word. This feature helped us extract the latent information of each word, including the words comprising the drug’s name. After this word-embedding training, we investigated whether the semantic feature (D2V) could represent the properties of drugs, such as biomedical and chemical properties. We visualized the relationships between the learned drug-embedding vectors based on their similarity (<xref ref-type="fig" rid="figure5">Figure 5</xref>). This graph included 746 drugs and presented the relationship of these drugs with those of the latent information learned from the semantic feature. Each node presents a drug and the edge represents the similarity between other drugs. The more similar the drugs in each pair were, the closer they were in the graph. The larger nodes represented the drugs that were more similar to other drugs. We found that the model seems to cluster the drugs used in specific treatments.</p>
      <fig id="figure5" position="float">
        <label>Figure 5</label>
        <caption>
          <p>Relationship between drugs using the semantic feature (drug2vec) of the deep neural network model. There were 746 nodes in this graph, each representing a drug. The clusters indicated the drugs with a specific treatment. Top: The cluster comprised antidepressants; middle: The cluster contained antibiotics; bottom: The cluster included ophthalmic medications.</p>
        </caption>
        <graphic xlink:href="jmir_v21i2e11016_fig5.PNG" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p>For instance, the drugs in the cluster with the blue circle shown in <xref ref-type="fig" rid="figure5">Figure 5</xref> (image on the top) comprised antidepressants such as trazodone, citalopram, clomipramine, and paroxetine. The cluster to the right contained antibiotics such as ampicillin, ceftazidime, cefpodoxime, and cefotaxime shown is <xref ref-type="fig" rid="figure5">Figure 5</xref> (image in the middle). Moreover, the cluster at the bottom included ophthalmic medications such as fluorometholone, levocabastine, brinzolamide, and dipiverfrin (<xref ref-type="fig" rid="figure5">Figure 5</xref>, image at the bottom). There were other small clusters with their own specific treatment. Thus, we learned the relationships among drugs and the latent information from the papers included in the embedding function at the text-level. Accordingly, the semantic feature had a great effect on the performance of our model.</p>
      <p>Subsequently, we examined the ability of this model to perform its identification and prediction functions with reference to serious ADRs defined by the Micromedex. Using the identification function of the model, we ranked the potential ADRs in a list by the probability of their occurrence (<xref ref-type="table" rid="table3">Table 3</xref>). One of the reasons why the probability of ADR presented in <xref ref-type="table" rid="table3">Table 3</xref> was not highly prominent was that the positive samples of these ADRs were rarely reported in this dataset. However, our model could identify that hydroxychloroquine led to muscle cramps, which is a serious ADR that occurs in severe neuromuscular disease. In addition, we extracted 5 drugs that were recorded only in 2012 to examine the prediction function of this model.</p>  
      <table-wrap position="float" id="table3">
        <label>Table 3</label>
        <caption>
          <p>The adverse drug reaction (ADR) prediction and identification results of the model.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="570"/>
          <col width="200"/>
          <col width="80"/>
          <col width="120"/>
          <thead>
            <tr valign="top">
              <td colspan="2">Drug</td>
              <td>Serious ADR</td>
              <td>Rank</td>
              <td>Probability</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="5"><bold>Identification results of drugs with known ADR records</bold></td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Dantrolene</td>
              <td>Anemia</td>
              <td>12</td>
              <td>0.012</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Dantrolene</td>
              <td>Congestive heart failure</td>
              <td>15</td>
              <td>0.009</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Hydroxychloroquine</td>
              <td>Muscle Cramp</td>
              <td>1</td>
              <td>0.997</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Hydroxychloroquine</td>
              <td>Photophobia</td>
              <td>16</td>
              <td>0.017</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>19-nortestosterone</td>
              <td>Serum cholesterol raised</td>
              <td>4</td>
              <td>0.150</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Carbachol</td>
              <td>Retinal detachment</td>
              <td>3</td>
              <td>0.690</td>
            </tr>
            <tr valign="top">
              <td colspan="5"><bold>Prediction results of drugs without ADR records</bold></td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Atazanavir</td>
              <td>Anemia</td>
              <td>17</td>
              <td>0.920</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Carbinoxamine maleate</td>
              <td>Agranulocytosis</td>
              <td>14</td>
              <td>0.453</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Carbinoxamine maleate</td>
              <td>Anemia, Hemolytic</td>
              <td>16</td>
              <td>0.340</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Darunavir</td>
              <td>Hyperglycemia</td>
              <td>20</td>
              <td>0.750</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Temsirolimus</td>
              <td>Infection</td>
              <td>20</td>
              <td>0.974</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Zoladex</td>
              <td>Myocardial infarction</td>
              <td>7</td>
              <td>0.961</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Zoladex</td>
              <td>Hypersensitivity</td>
              <td>12</td>
              <td>0.920</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <p>Findings revealed that our model has the capacity to predict the serious ADRs of new drugs. For instance, the model predicted that Zoladex could lead to a serious ADR, myocardial infarction, which is one of the commonest causes of death in developing countries.</p></sec>
      <sec>
        <title>Limitations</title>
        <p>This study has several limitations that need to be addressed in future studies. First, data diversity plays an important role in the model. We only used the data published in SIDER. Our model will be more persuasive and reliable if we can include more data from different datasets. Because the chemical and biological properties of drugs contribute most to their effects on human, the more the databases of drug properties included, the better the performance of our model. On the other hand, if we have access to more open-source data, including clinical trials, spontaneous reporting systems, and EMRs with support from government and pharmaceutical industry, our model will have better prediction. Furthermore, our model focused on the ADR prediction and identification. To identify the probability of occurrence of each ADR, we set 1325 hidden nodes and the total number of ADRs in the dataset in the output layer. In other words, although we had a mapping function to address new drugs, this model could only predict existing ADRs. Therefore, in the future work, we plan to utilize more detailed features such as drug-ADR interaction [<xref ref-type="bibr" rid="ref13">13</xref>], drug-drug interaction, and ADR-ADR interaction networks for the prediction of ADRs. Furthermore, we also plan to investigate other embedding approaches to represent the ADRs to help predict the relationships between drugs and new ADRs.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>We developed a novel ADR detection model based on the biological and chemical properties of drugs and the D2V (the semantic feature). After discussing the drug similarities with domain experts from the National Cheng Kung University Hospital and the Institute of Clinical Pharmacy and Pharmaceutical Sciences, we found out that the D2V can represent a characteristic of the drug. Our model could not only discover the potential ADRs of drugs but also predict the possible ADRs of new drugs. To discover potential ADRs based on the previous records, our model could identify the hidden relationship between ADR-ADR interactions. Furthermore, to predict the possible ADRs of a new drug without any previous ADR records, using the D2V feature, our mapping function exhibited good profiling for transferring the drug description into the D2V. The model exhibited good performance on both tasks and generated the most suitable results. It will help pharmacists and health care providers to understand the potential risk of side effect of drugs and address the issue of underreporting of spontaneous reports. Above all, our model will aid pharmacovigilance by identifying and predicting potential ADRs.</p>
      </sec>
    </sec>
  </body>
  <back>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb0">ADE</term>
          <def>
            <p>adverse drug events</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb1">ADR</term>
          <def>
            <p>adverse drug reaction</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AUC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">DNN</term>
          <def>
            <p>deep neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">EMR</term>
          <def>
            <p>electronic medical records</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">MAP</term>
          <def>
            <p>mean average precision</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">MEDLINE</term>
          <def>
            <p>Medical Literature Analysis and Retrieval System Online</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">PMF</term>
          <def>
            <p>probability matrix factorization</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">SIDER</term>
          <def>
            <p>Side Effect Resource</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors would like to express their great appreciation to the Ministry of Science and Technology (MOST) and the Ministry of Health and Welfare (MOHW) for their support (grant numbers: MOST 104-2923-E-006-003-MY3, MOST 107-2634-F-006-006, and MOHW105-FDA-D-113-000416). The authors would also like to appreciate Yung-Hsin Tseng, a master’s student, who was involved in conventional test and case study.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Coleman</surname>
            <given-names>JJ</given-names>
          </name>
          <name name-style="western">
            <surname>Pontefract</surname>
            <given-names>SK</given-names>
          </name>
        </person-group>
        <article-title>Adverse drug reactions</article-title>
        <source>Clin Med (Lond)</source>  
        <year>2016</year>  
        <month>10</month>  
        <volume>16</volume>  
        <issue>5</issue>  
        <fpage>481</fpage>  
        <lpage>485</lpage>  
        <pub-id pub-id-type="doi">10.7861/clinmedicine.16-5-481</pub-id>
        <pub-id pub-id-type="medline">27697815</pub-id>
        <pub-id pub-id-type="pii">16/5/481</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Edwards</surname>
            <given-names>IR</given-names>
          </name>
          <name name-style="western">
            <surname>Aronson</surname>
            <given-names>JK</given-names>
          </name>
        </person-group>
        <article-title>Adverse drug reactions: definitions, diagnosis, and management</article-title>
        <source>Lancet</source>  
        <year>2000</year>  
        <month>10</month>  
        <day>07</day>  
        <volume>356</volume>  
        <issue>9237</issue>  
        <fpage>1255</fpage>  
        <lpage>9</lpage>  
        <pub-id pub-id-type="doi">10.1016/S0140-6736(00)02799-9</pub-id>
        <pub-id pub-id-type="medline">11072960</pub-id>
        <pub-id pub-id-type="pii">S0140-6736(00)02799-9</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Couper</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <source>World Health Organization</source>  
        <year>2002</year>  
        <access-date>2018-11-30</access-date>
        <comment>Safety of Medicines: A guide to detecting and reporting adverse drug reactions 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://apps.who.int/iris/bitstream/handle/10665/67378/WHO_EDM_QSM_2002.2.pdf;jsessionid=A03B5B56E0F1BCB404D0E3315FCA27F5?sequence=1">http://apps.who.int/iris/bitstream/handle/10665/67378/WHO_EDM_QSM_2002.2.pdf;jsessionid=A03B5B56E0F1BCB404D0E3315FCA27F5?sequence=1</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="74JWvMVtQ"/></comment> </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lazarou</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Pomeranz</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Corey</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>Incidence of adverse drug reactions in hospitalized patients: a meta-analysis of prospective studies</article-title>
        <source>JAMA</source>  
        <year>1998</year>  
        <month>04</month>  
        <day>15</day>  
        <volume>279</volume>  
        <issue>15</issue>  
        <fpage>1200</fpage>  
        <lpage>5</lpage>  
        <pub-id pub-id-type="medline">9555760</pub-id>
        <pub-id pub-id-type="pii">jma71005</pub-id></nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yao</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Zhu</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Jiang</surname>
            <given-names>Q</given-names>
          </name>
          <name name-style="western">
            <surname>Xia</surname>
            <given-names>HA</given-names>
          </name>
        </person-group>
        <article-title>Safety monitoring in clinical trials</article-title>
        <source>Pharmaceutics</source>  
        <year>2013</year>  
        <month>01</month>  
        <day>17</day>  
        <volume>5</volume>  
        <issue>1</issue>  
        <fpage>94</fpage>  
        <lpage>106</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.mdpi.com/resolver?pii=pharmaceutics5010094"/>
        </comment>  
        <pub-id pub-id-type="doi">10.3390/pharmaceutics5010094</pub-id>
        <pub-id pub-id-type="medline">24300399</pub-id>
        <pub-id pub-id-type="pii">pharmaceutics5010094</pub-id>
        <pub-id pub-id-type="pmcid">PMC3834937</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hazell</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Shakir</surname>
            <given-names>SAW</given-names>
          </name>
        </person-group>
        <article-title>Under-reporting of adverse drug reactions : a systematic review</article-title>
        <source>Drug Saf</source>  
        <year>2006</year>  
        <volume>29</volume>  
        <issue>5</issue>  
        <fpage>385</fpage>  
        <lpage>96</lpage>  
        <pub-id pub-id-type="doi">10.2165/00002018-200629050-00003</pub-id>
        <pub-id pub-id-type="medline">16689555</pub-id>
        <pub-id pub-id-type="pii">2953</pub-id></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Brown</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Kulldorff</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Chan</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Davis</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Graham</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Pettus</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Andrade</surname>
            <given-names>SE</given-names>
          </name>
          <name name-style="western">
            <surname>Raebel</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Herrinton</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Roblin</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Boudreau</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Smith</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Gurwitz</surname>
            <given-names>JH</given-names>
          </name>
          <name name-style="western">
            <surname>Gunter</surname>
            <given-names>MJ</given-names>
          </name>
          <name name-style="western">
            <surname>Platt</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Early detection of adverse drug events within population-based health networks: application of sequential testing methods</article-title>
        <source>Pharmacoepidemiol Drug Saf</source>  
        <year>2007</year>  
        <month>12</month>  
        <volume>16</volume>  
        <issue>12</issue>  
        <fpage>1275</fpage>  
        <lpage>84</lpage>  
        <pub-id pub-id-type="doi">10.1002/pds.1509</pub-id>
        <pub-id pub-id-type="medline">17955500</pub-id></nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Naranjo</surname>
            <given-names>CA</given-names>
          </name>
          <name name-style="western">
            <surname>Busto</surname>
            <given-names>U</given-names>
          </name>
          <name name-style="western">
            <surname>Sellers</surname>
            <given-names>EM</given-names>
          </name>
          <name name-style="western">
            <surname>Sandor</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Ruiz</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Roberts</surname>
            <given-names>EA</given-names>
          </name>
          <name name-style="western">
            <surname>Janecek</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Domecq</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Greenblatt</surname>
            <given-names>DJ</given-names>
          </name>
        </person-group>
        <article-title>A method for estimating the probability of adverse drug reactions</article-title>
        <source>Clin Pharmacol Ther</source>  
        <year>1981</year>  
        <month>08</month>  
        <volume>30</volume>  
        <issue>2</issue>  
        <fpage>239</fpage>  
        <lpage>45</lpage>  
        <pub-id pub-id-type="medline">7249508</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bate</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Lindquist</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Edwards</surname>
            <given-names>IR</given-names>
          </name>
          <name name-style="western">
            <surname>Olsson</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Orre</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Lansner</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>De Freitas</surname>
            <given-names>RM</given-names>
          </name>
        </person-group>
        <article-title>A Bayesian neural network method for adverse drug reaction signal generation</article-title>
        <source>Eur J Clin Pharmacol</source>  
        <year>1998</year>  
        <month>06</month>  
        <volume>54</volume>  
        <issue>4</issue>  
        <fpage>315</fpage>  
        <lpage>21</lpage>  
        <pub-id pub-id-type="medline">9696956</pub-id></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Nikfarjam</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Sarker</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>O'Connor</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Ginn</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Gonzalez</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Pharmacovigilance from social media: mining adverse drug reaction mentions using sequence labeling with word embedding cluster features</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2015</year>  
        <month>05</month>  
        <volume>22</volume>  
        <issue>3</issue>  
        <fpage>671</fpage>  
        <lpage>81</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25755127"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1093/jamia/ocu041</pub-id>
        <pub-id pub-id-type="medline">25755127</pub-id>
        <pub-id pub-id-type="pii">ocu041</pub-id>
        <pub-id pub-id-type="pmcid">PMC4457113</pub-id></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Kiang</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Shang</surname>
            <given-names>W</given-names>
          </name>
        </person-group>
        <article-title>Filtering big data from social media--Building an early warning system for adverse drug reactions</article-title>
        <source>J Biomed Inform</source>  
        <year>2015</year>  
        <month>04</month>  
        <volume>54</volume>  
        <fpage>230</fpage>  
        <lpage>40</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(15)00013-1"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2015.01.011</pub-id>
        <pub-id pub-id-type="medline">25688695</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(15)00013-1</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Salmasian</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Vilar</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Chase</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Friedman</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Wei</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <article-title>A method for controlling complex confounding effects in the detection of adverse drug reactions using electronic health records</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2014</year>  
        <volume>21</volume>  
        <issue>2</issue>  
        <fpage>308</fpage>  
        <lpage>14</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23907285"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/amiajnl-2013-001718</pub-id>
        <pub-id pub-id-type="medline">23907285</pub-id>
        <pub-id pub-id-type="pii">amiajnl-2013-001718</pub-id>
        <pub-id pub-id-type="pmcid">PMC3932454</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Karimi</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Metke-Jimenez</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Gaire</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Paris</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Text and Data Mining Techniques in Adverse Drug Reaction Detection</article-title>
        <source>ACM Comput Surv</source>  
        <year>2015</year>  
        <month>07</month>  
        <day>21</day>  
        <volume>47</volume>  
        <issue>4</issue>  
        <fpage>1</fpage>  
        <lpage>39</lpage>  
        <pub-id pub-id-type="doi">10.1145/2719920</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Tatonetti</surname>
            <given-names>NP</given-names>
          </name>
          <name name-style="western">
            <surname>Fernald</surname>
            <given-names>GH</given-names>
          </name>
          <name name-style="western">
            <surname>Altman</surname>
            <given-names>RB</given-names>
          </name>
        </person-group>
        <article-title>A novel signal detection algorithm for identifying hidden drug-drug interactions in adverse event reports</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2012</year>  
        <volume>19</volume>  
        <issue>1</issue>  
        <fpage>79</fpage>  
        <lpage>85</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21676938"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000214</pub-id>
        <pub-id pub-id-type="medline">21676938</pub-id>
        <pub-id pub-id-type="pii">amiajnl-2011-000214</pub-id>
        <pub-id pub-id-type="pmcid">PMC3240755</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Jung</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Winnenburg</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Shah</surname>
            <given-names>NH</given-names>
          </name>
        </person-group>
        <article-title>A method for systematic discovery of adverse drug events from clinical notes</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2015</year>  
        <month>11</month>  
        <volume>22</volume>  
        <issue>6</issue>  
        <fpage>1196</fpage>  
        <lpage>204</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26232442"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1093/jamia/ocv102</pub-id>
        <pub-id pub-id-type="medline">26232442</pub-id>
        <pub-id pub-id-type="pii">ocv102</pub-id>
        <pub-id pub-id-type="pmcid">PMC4921953</pub-id></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Haerian</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Salmasian</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Harpaz</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Chase</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Friedman</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>A drug-adverse event extraction algorithm to support pharmacovigilance knowledge mining from PubMed citations</article-title>
        <source>AMIA Annu Symp Proc</source>  
        <year>2011</year>  
        <volume>2011</volume>  
        <fpage>1464</fpage>  
        <lpage>70</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22195210"/>
        </comment>  
        <pub-id pub-id-type="medline">22195210</pub-id>
        <pub-id pub-id-type="pmcid">PMC3243206</pub-id></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Finkelstein</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Q</given-names>
          </name>
          <name name-style="western">
            <surname>Adams</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Friedman</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Automated Summarization of Publications Associated with Adverse Drug Reactions from PubMed</article-title>
        <source>AMIA Jt Summits Transl Sci Proc</source>  
        <year>2016</year>  
        <volume>2016</volume>  
        <fpage>68</fpage>  
        <lpage>77</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27570654"/>
        </comment>  
        <pub-id pub-id-type="medline">27570654</pub-id>
        <pub-id pub-id-type="pmcid">PMC5001779</pub-id></nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Cheng</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>Z</given-names>
          </name>
        </person-group>
        <article-title>Machine learning-based prediction of drug-drug interactions by integrating drug phenotypic, therapeutic, chemical, and genomic properties</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2014</year>  
        <month>10</month>  
        <volume>21</volume>  
        <issue>e2</issue>  
        <fpage>e278</fpage>  
        <lpage>86</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24644270"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/amiajnl-2013-002512</pub-id>
        <pub-id pub-id-type="medline">24644270</pub-id>
        <pub-id pub-id-type="pii">amiajnl-2013-002512</pub-id>
        <pub-id pub-id-type="pmcid">PMC4173180</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Cami</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Arnold</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Manzi</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Reis</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <article-title>Predicting adverse drug events using pharmacological network models</article-title>
        <source>Sci Transl Med</source>  
        <year>2011</year>  
        <month>12</month>  
        <day>21</day>  
        <volume>3</volume>  
        <issue>114</issue>  
        <fpage>114ra127</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://stm.sciencemag.org/cgi/pmidlookup?view=long&amp;pmid=22190238"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1126/scitranslmed.3002774</pub-id>
        <pub-id pub-id-type="medline">22190238</pub-id>
        <pub-id pub-id-type="pii">3/114/114ra127</pub-id></nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lorberbaum</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Nasir</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Keiser</surname>
            <given-names>MJ</given-names>
          </name>
          <name name-style="western">
            <surname>Vilar</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Hripcsak</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Tatonetti</surname>
            <given-names>NP</given-names>
          </name>
        </person-group>
        <article-title>Systems pharmacology augments drug safety surveillance</article-title>
        <source>Clin Pharmacol Ther</source>  
        <year>2015</year>  
        <month>02</month>  
        <volume>97</volume>  
        <issue>2</issue>  
        <fpage>151</fpage>  
        <lpage>8</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25670520"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1002/cpt.2</pub-id>
        <pub-id pub-id-type="medline">25670520</pub-id>
        <pub-id pub-id-type="pmcid">PMC4325423</pub-id></nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>JY</given-names>
          </name>
        </person-group>
        <article-title>Predicting adverse drug reaction profiles by integrating protein interaction networks with drug structures</article-title>
        <source>Proteomics</source>  
        <year>2013</year>  
        <month>01</month>  
        <volume>13</volume>  
        <issue>2</issue>  
        <fpage>313</fpage>  
        <lpage>24</lpage>  
        <pub-id pub-id-type="doi">10.1002/pmic.201200337</pub-id>
        <pub-id pub-id-type="medline">23184540</pub-id></nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Sun</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>Z</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Matheny</surname>
            <given-names>ME</given-names>
          </name>
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Large-scale prediction of adverse drug reactions using chemical, biological, and phenotypic properties of drugs</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2012</year>  
        <month>06</month>  
        <volume>19</volume>  
        <issue>e1</issue>  
        <fpage>e28</fpage>  
        <lpage>35</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22718037"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000699</pub-id>
        <pub-id pub-id-type="medline">22718037</pub-id>
        <pub-id pub-id-type="pii">amiajnl-2011-000699</pub-id>
        <pub-id pub-id-type="pmcid">PMC3392844</pub-id></nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kuhn</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Campillos</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Letunic</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Jensen</surname>
            <given-names>LJ</given-names>
          </name>
          <name name-style="western">
            <surname>Bork</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>A side effect resource to capture phenotypic effects of drugs</article-title>
        <source>Mol Syst Biol</source>  
        <year>2010</year>  
        <volume>6</volume>  
        <fpage>343</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://MSB.embopress.org/cgi/pmidlookup?view=long&amp;pmid=20087340"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1038/msb.2009.98</pub-id>
        <pub-id pub-id-type="medline">20087340</pub-id>
        <pub-id pub-id-type="pii">msb200998</pub-id>
        <pub-id pub-id-type="pmcid">PMC2824526</pub-id></nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kuhn</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Letunic</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Jensen</surname>
            <given-names>LJ</given-names>
          </name>
          <name name-style="western">
            <surname>Bork</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>The SIDER database of drugs and side effects</article-title>
        <source>Nucleic Acids Res</source>  
        <year>2016</year>  
        <month>01</month>  
        <day>04</day>  
        <volume>44</volume>  
        <issue>D1</issue>  
        <fpage>D1075</fpage>  
        <lpage>9</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26481350"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1093/nar/gkv1075</pub-id>
        <pub-id pub-id-type="medline">26481350</pub-id>
        <pub-id pub-id-type="pii">gkv1075</pub-id>
        <pub-id pub-id-type="pmcid">PMC4702794</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Wild</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Guha</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>PubChem as a source of polypharmacology</article-title>
        <source>J Chem Inf Model</source>  
        <year>2009</year>  
        <month>09</month>  
        <volume>49</volume>  
        <issue>9</issue>  
        <fpage>2044</fpage>  
        <lpage>55</lpage>  
        <pub-id pub-id-type="doi">10.1021/ci9001876</pub-id>
        <pub-id pub-id-type="medline">19708682</pub-id></nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wishart</surname>
            <given-names>DS</given-names>
          </name>
          <name name-style="western">
            <surname>Feunang</surname>
            <given-names>YD</given-names>
          </name>
          <name name-style="western">
            <surname>Guo</surname>
            <given-names>AC</given-names>
          </name>
          <name name-style="western">
            <surname>Lo</surname>
            <given-names>EJ</given-names>
          </name>
          <name name-style="western">
            <surname>Marcu</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Grant</surname>
            <given-names>JR</given-names>
          </name>
          <name name-style="western">
            <surname>Sajed</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Johnson</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Sayeeda</surname>
            <given-names>Z</given-names>
          </name>
          <name name-style="western">
            <surname>Assempour</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Iynkkaran</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Maciejewski</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Gale</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Wilson</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Chin</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Cummings</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Le</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Pon</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Knox</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Wilson</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>DrugBank 5.0: a major update to the DrugBank database for 2018</article-title>
        <source>Nucleic Acids Res</source>  
        <year>2018</year>  
        <month>01</month>  
        <day>04</day>  
        <volume>46</volume>  
        <issue>D1</issue>  
        <fpage>D1074</fpage>  
        <lpage>D1082</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29126136"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1093/nar/gkx1037</pub-id>
        <pub-id pub-id-type="medline">29126136</pub-id>
        <pub-id pub-id-type="pii">4602867</pub-id>
        <pub-id pub-id-type="pmcid">PMC5753335</pub-id></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Srinivasan</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>Text mining: Generating hypotheses from MEDLINE</article-title>
        <source>J Am Soc Inf Sci</source>  
        <year>2004</year>  
        <month>03</month>  
        <volume>55</volume>  
        <issue>5</issue>  
        <fpage>396</fpage>  
        <lpage>413</lpage>  
        <pub-id pub-id-type="doi">10.1002/asi.10389</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Mikolov</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Corrado</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Dean</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Efficient Estimation of Word Representations in Vector Space</article-title>
        <source>arXiv preprint arXiv:1301.3781</source>  
        <year>2013</year>  
        <month>1</month>  
        <day>16</day>  
        <fpage>-</fpage>  
        <pub-id pub-id-type="doi">10.1109/TNN.2003.820440</pub-id>
        <pub-id pub-id-type="medline">18244602</pub-id></nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Le</surname>
            <given-names>QV</given-names>
          </name>
          <name name-style="western">
            <surname>Mikolov</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <article-title>Distributed Representations of Sentences and Documents</article-title>
        <year>2014</year>  
        <conf-name>ICML'14 Proceedings of the 31st International Conference on International Conference on Machine Learning</conf-name>
        <conf-date>June 21-26, 2014</conf-date>
        <conf-loc>Beijing, China</conf-loc>
        <fpage>1188</fpage>  
        <lpage>1196</lpage> </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal"> <person-group person-group-type="author"> <name name-style="western"> <surname>Bojanowski</surname> <given-names>P</given-names> </name> <name name-style="western"> <surname>Grave</surname> <given-names>E</given-names> </name> <name name-style="western"> <surname>Joulin</surname> <given-names>A</given-names> </name> <name name-style="western"> <surname>Mikolov</surname> <given-names>T</given-names> </name> </person-group> <article-title>Enriching Word Vectors with Subword Information</article-title> <source>Transactions of the Association for Computational Linguistics</source> <year>2017</year> <month>12</month> <volume>5</volume> <fpage>135</fpage> <lpage>146</lpage> <comment><ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1607.04606"/></comment> <pub-id pub-id-type="doi">10.1162/tacl_a_00051</pub-id> </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sugawara</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Nikaido</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Properties of AdeABC and AdeIJK efflux systems of Acinetobacter baumannii compared with those of the AcrAB-TolC system of Escherichia coli</article-title>
        <source>Antimicrob Agents Chemother</source>  
        <year>2014</year>  
        <month>12</month>  
        <volume>58</volume>  
        <issue>12</issue>  
        <fpage>7250</fpage>  
        <lpage>7</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://aac.asm.org/cgi/pmidlookup?view=long&amp;pmid=25246403"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1128/AAC.03728-14</pub-id>
        <pub-id pub-id-type="medline">25246403</pub-id>
        <pub-id pub-id-type="pii">AAC.03728-14</pub-id>
        <pub-id pub-id-type="pmcid">PMC4249520</pub-id></nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Tibshirani</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Regression shrinkage and selection via the lasso: a retrospective</article-title>
        <source>J R Statist Soc B</source>  
        <year>2011</year>  
        <volume>73</volume>  
        <fpage>273</fpage>  
        <lpage>282</lpage> </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Singhal</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Simmons</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>Z</given-names>
          </name>
        </person-group>
        <article-title>Text mining for precision medicine: automating disease-mutation relationship extraction from biomedical literature</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2016</year>  
        <month>12</month>  
        <volume>23</volume>  
        <issue>4</issue>  
        <fpage>766</fpage>  
        <lpage>72</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27121612"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1093/jamia/ocw041</pub-id>
        <pub-id pub-id-type="medline">27121612</pub-id>
        <pub-id pub-id-type="pii">ocw041</pub-id>
        <pub-id pub-id-type="pmcid">PMC4926749</pub-id></nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web"> <person-group person-group-type="author"> <name name-style="western"> <surname>Hinton</surname> <given-names>G</given-names> </name> <name name-style="western"> <surname>Srivastava</surname> <given-names>N</given-names> </name> <name name-style="western"> <surname>Krizhevsky</surname> <given-names>A</given-names> </name> <name name-style="western"> <surname>Sutskever</surname> <given-names>I</given-names> </name> <name name-style="western"> <surname>Salakhutdinov</surname> <given-names>R</given-names> </name> </person-group> <source>Improving neural networks by preventing co-adaptation of feature detectors</source> <year>2012</year> <month>6</month> <day>3</day> <comment><ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1207.0580.pdf">https://arxiv.org/pdf/1207.0580.pdf</ext-link> <ext-link ext-link-type="webcite" xlink:href="75xhdRuMY"/> </comment> </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Srivastava</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Hinton</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Krizhevsky</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Sutskever</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Salakhutdinov</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Learning to detect cells using non-overlapping extremal regions</article-title>
        <source>The Journal of Machine Learning Research</source>  
        <year>2014</year>  
        <month>01</month>  
        <volume>15</volume>  
        <issue>1</issue>  
        <fpage>348</fpage>  
        <lpage>56</lpage>  
        <pub-id pub-id-type="medline">23285570</pub-id></nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ruta</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Robust method of sparse feature selection for multi-label classification with Naive Bayes</article-title>
        <year>2014</year>  
        <conf-name>Federated Conference on Computer Science and Information Systems, FedCSIS</conf-name>
        <conf-date>September 2014</conf-date>
        <conf-loc>Warsaw, Poland</conf-loc>
        <fpage>380</fpage>  
        <pub-id pub-id-type="doi">10.15439/2014F502</pub-id></nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pinto</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Costa</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Camacho</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Costa</surname>
            <given-names>V.S</given-names>
          </name>
        </person-group>
        <article-title>Predicting drugs adverse side-effects using a recommender-system</article-title>
        <source>Springer</source>  
        <year>2015</year>  
        <conf-name>International Conference on Discovery Science</conf-name>
        <conf-date>4-6 October</conf-date>
        <conf-loc>Banff, Canada</conf-loc>
        <fpage>201</fpage>  
        <lpage>208</lpage> </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
