<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v24i7e37233</article-id>
      <article-id pub-id-type="pmid">35838763</article-id>
      <article-id pub-id-type="doi">10.2196/37233</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Drug Recommendation System for Diabetes Using a Collaborative Filtering and Clustering Approach: Development and Performance Evaluation</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Kukafka</surname>
            <given-names>Rita</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Benis</surname>
            <given-names>Arriel</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Uludag</surname>
            <given-names>Kadir</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Granda Morales</surname>
            <given-names>Luis Fernando</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2378-8841</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Valdiviezo-Diaz</surname>
            <given-names>Priscila</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Departamento de Ciencias de la Computación y Electrónica</institution>
            <institution>Universidad Técnica Particular de Loja</institution>
            <addr-line>San Cayetano Alto</addr-line>
            <addr-line>Loja, 1101608</addr-line>
            <country>Ecuador</country>
            <phone>593 7 3701444 ext 2325</phone>
            <email>pmvaldiviezo@utpl.edu.ec</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5216-8820</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Reátegui</surname>
            <given-names>Ruth</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7304-4413</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Barba-Guaman</surname>
            <given-names>Luis</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8569-3322</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Departamento de Ciencias de la Computación y Electrónica</institution>
        <institution>Universidad Técnica Particular de Loja</institution>
        <addr-line>Loja</addr-line>
        <country>Ecuador</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Priscila Valdiviezo-Diaz <email>pmvaldiviezo@utpl.edu.ec</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>7</month>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>15</day>
        <month>7</month>
        <year>2022</year>
      </pub-date>
      <volume>24</volume>
      <issue>7</issue>
      <elocation-id>e37233</elocation-id>
      <history>
        <date date-type="received">
          <day>11</day>
          <month>2</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>5</day>
          <month>4</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>18</day>
          <month>4</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>29</day>
          <month>5</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Luis Fernando Granda Morales, Priscila Valdiviezo-Diaz, Ruth Reátegui, Luis Barba-Guaman. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 15.07.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2022/7/e37233" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Diabetes is a public health problem worldwide. Although diabetes is a chronic and incurable disease, measures and treatments can be taken to control it and keep the patient stable. Diabetes has been the subject of extensive research, ranging from disease prevention to the use of technologies for its diagnosis and control. Health institutions obtain information required for the diagnosis of diabetes through various tests, and appropriate treatment is provided according to the diagnosis. These institutions have databases with large volumes of information that can be analyzed and used in different applications such as pattern discovery and outcome prediction, which can help health personnel in making decisions about treatments or determining the appropriate  prescriptions for diabetes management.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to develop a drug recommendation system for patients with diabetes based on collaborative filtering and clustering techniques as a complement to the treatments given by the treating doctor.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>The data set used contains information from patients with diabetes available in the University of California Irvine Machine Learning Repository. Data mining techniques were applied for processing and analysis of the data set. Unsupervised learning techniques were used for dimensionality reduction and patient clustering. Drug predictions were obtained with a user-based collaborative filtering approach, which enabled creating a patient profile that can be compared with the profiles of other patients with similar characteristics. Finally, recommendations were made considering the identified patient groups. The performance of the system was evaluated using metrics to assess the quality of the groups and the quality of the predictions and recommendations.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Principal component analysis to reduce the dimensionality of the data showed that eight components best explained the variability of the data. We identified six groups of patients using the clustering algorithm, which were evenly distributed. These groups were identified based on the available information of patients with diabetes, and then the variation between groups was examined to predict a suitable medication for a target patient. The recommender system achieved good results in the quality of predictions with a mean squared error metric of 0.51 and accuracy in the quality of recommendations of 0.61, which is acceptable.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This work presents a recommendation system that suggests medications according to drug information and the characteristics of patients with diabetes. Some aspects related to this disease were analyzed based on the data set used from patients with diabetes. The experimental results with clustering and prediction techniques were found to be acceptable for the recommendation process. This system can provide a novel perspective for health institutions that require technologies to support health care personnel in the management of diabetes treatment and control.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>clustering</kwd>
        <kwd>collaborative filtering</kwd>
        <kwd>diabetes</kwd>
        <kwd>recommender system</kwd>
        <kwd>recommend</kwd>
        <kwd>drug</kwd>
        <kwd>chronic disease</kwd>
        <kwd>patient information</kwd>
        <kwd>data mining</kwd>
        <kwd>machine learning</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Owing to the large amount of information available in health institution databases, including medical treatments, diagnostic tests, clinical histories, and drug characteristics, there is a need to implement recommender systems (RSs) that support medical staff in activities related to health control and management. The main concept of an RS is to suggest items that are particularly suitable for the user based on their profile or historical preferences. In the context of health, these items can be drugs, medical treatments, health videos, and patients sharing the same disease. An RS employs data sources to learn about user preferences through machine-learning algorithms and information-filtering techniques such as content-based, collaborative filtering–based, demographic, and hybrid approaches [<xref ref-type="bibr" rid="ref1">1</xref>].</p>
        <p>Currently, more than 80% of internet users seek health information through various platforms, including social networks, a figure that, according to De Choudhur et al [<xref ref-type="bibr" rid="ref2">2</xref>], continues to grow. Through the internet, users can identify patients with the same disease, the possible causes of their ailments, find procedures to alleviate a particular disease, learn new healthy habits, and find general health information [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref5">5</xref>].</p>
        <p>In the case of chronic diseases such as diabetes, the prescription of multiple drugs is common; thus, RSs can support the intervention of the treating doctor in determining which drugs to prescribe to a particular patient. Considering the current health status of a patient, their clinical history, medications prescribed in previous periods, specific symptoms, and other characteristics, the system can search for patients with similar parameters in the database and suggest drugs that have been more successful in these cases, which could be recommended to the target patient.</p>
        <p>Some research has been performed on RSs in the health area. For example, Zhang et al [<xref ref-type="bibr" rid="ref6">6</xref>] proposed the iDoctor system to provide users with personalized medical recommendations. This system explores users’ emotions and preferences about doctors through their ratings and reviews. Gujar et al [<xref ref-type="bibr" rid="ref7">7</xref>] proposed data-mining techniques for the prediction of a disease and to make a recommendation for specialists about the predicted disease. Kuanr et al [<xref ref-type="bibr" rid="ref8">8</xref>] proposed an RS for cervical cancer in which predictive models showed high accuracy. Poornima [<xref ref-type="bibr" rid="ref9">9</xref>] presented a daily nutrition RS for women taking into consideration physical data, preferences, and personal information to combat diseases such as malnutrition, obesity, and cardiovascular diseases.</p>
        <p>Other research has focused primarily on recommending doctors and hospitals that are best suited to a specific patient profile [<xref ref-type="bibr" rid="ref10">10</xref>], medication recommendations [<xref ref-type="bibr" rid="ref11">11</xref>], treatment recommendations for patients over time [<xref ref-type="bibr" rid="ref12">12</xref>], videos about health [<xref ref-type="bibr" rid="ref13">13</xref>], and even customized meal plans [<xref ref-type="bibr" rid="ref14">14</xref>].</p>
        <p>Recently, several studies related to the use of RSs in diabetes have emerged, including some exploratory analyses on the disease, predictions on diet plans to combat obesity and diabetes [<xref ref-type="bibr" rid="ref14">14</xref>], and physical activity and diet plan RSs to help prevent chronic diseases [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
        <p>Clustering is one of the most widely used machine-learning techniques in the field of health to identify patterns or groups of patients with similar characteristics [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. Although the clustering technique has been the subject of research in the area of RSs, these systems have not yet been widely used in medicine. Moreover, technologies that enable only the analysis or prediction of diagnoses or diseases would not be sufficient to provide personalized care to the patient or to support health personnel in making decisions about which drugs to consider for certain diseases. Therefore, we here propose a drug RS for patients with diabetes based on clustering techniques as a complement to the treatments given by the treating doctor.</p>
        <p>Both drug predictions and recommendations were evaluated using traditional metrics to measure the performance of the RS.</p>
      </sec>
      <sec>
        <title>Contribution</title>
        <p>The aim of this study was to complement previous diabetes-related studies by first analyzing data related to patients with diabetes to obtain important information for the management of this disease, followed by identifying groups of patients who share similar characteristics, which could enable discovering patterns of interest that can support decision-making. Finally, an RS was developed that suggests medications for diabetes according to the patient’s historical information and the doses of the medications administered.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Set</title>
        <p>The data set used was obtained from the University of California Irvine (UCI) Machine Learning Repository [<xref ref-type="bibr" rid="ref18">18</xref>], which contains information on patients with diseases associated with diabetes [<xref ref-type="bibr" rid="ref19">19</xref>]. The original data set includes more than 50 features representing patient outcomes from 130 US hospitals. This data set has more than 100,000 patient records, which refer to 10 years of health care records (from 1999 to 2008).</p>
        <p>In summary, the information contained in the data set refers to: admissions of patients to the hospital; information on 24 medications administered to patients with diabetes; changes in the patients’ medication, and whether the dosage was increased, reduced, kept stable, or not administered; number of medications administered to the patient; time spent by the patient in the hospital, recorded in days; results of tests that were indicated to patients prior to and during their treatment; diagnosis; type of admission; specialty of the treating doctor; and patient data such as age, race, and gender.</p>
      </sec>
      <sec>
        <title>Exploratory Data Analysis</title>
        <p>Exploratory analysis of the data set is a critical process in research to discover patterns, detect anomalies, test hypotheses, and test assumptions with the help of statistics and graphical representations. It is good practice to first understand the data to obtain as much information as possible.</p>
        <p>Toward this end, in the initial analysis of the patient data, we determined that most of the patients belong to the age range of 50 to 80 years, and we classified patients according to readmission status (ie, if the patient presents a case of readmission greater than or less than 30 days, and no readmission). <xref rid="figure1" ref-type="fig">Figure 1</xref> shows the relationship between age and patient readmission, demonstrating very few cases of readmission for younger patients (under 40 years of age). In addition, women had a slightly higher readmission rate than men in cases of readmission longer than 30 days. Readmission showed a similar distribution for patients with and without medication prescribed for diabetes prior to hospital treatment. In addition, we determined that the majority of the patients were of the Caucasian race and did not have a glucose or hemoglobin A1C test.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Distribution of patients according to age and readmission.</p>
          </caption>
          <graphic xlink:href="jmir_v24i7e37233_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Data Preparation</title>
        <sec>
          <title>Overview</title>
          <p>Data preparation, also known as preprocessing, is a key task in the initial stages to ensure a correct analysis of the information available. Before applying the clustering techniques, the original data set was cleaned by removing all duplicated cases of patients and eliminating records of patients who had not been prescribed any medication. We then performed data transformation and variable selection.</p>
        </sec>
        <sec>
          <title>Data Transformation</title>
          <p>The data transformation process generally involves converting variables to another type of data and creating new variables. In our case, we converted categorical variables to binary variables, such as gender, maximum glucose serum level, and hemoglobin A1C test result.</p>
          <p>New variables were created from the categories of the first diagnosis variable, which was coded according to the first three digits of the International Classification of Diseases-9 system: circulatory, diabetes, digestive, genitourinary, injuries, musculoskeletal, neoplasms, respiratory, and other. The categories of the race variable were created as new variables. Subsequently, the first diagnosis and race variables were removed from the data set. In addition, the age ranges were replaced by the mean of the ranges.</p>
        </sec>
        <sec>
          <title>Variable Selection</title>
          <p>Noninformative features in the data set were discarded due to a large number of missing values (50,000/100,000, 50.00%) or because some features were not relevant to classifying the data, such as patient identification, or if the feature is unbalanced (n=95,000, &#62;95% of the data had the same value for a feature). In addition, we selected patients who had been prescribed at least two medications. <xref ref-type="table" rid="table1">Table 1</xref> lists the discarded parameters (features) and the reasons for discarding them.</p>
          <p>As a result, a final data set was obtained with 5177 unique patient records and 42 variables, which were categorized as patient characteristics and medications administered to patients. These final attributes are detailed in <xref ref-type="table" rid="table2">Table 2</xref> and <xref ref-type="table" rid="table3">Table 3</xref>, respectively.</p>
          <p>Drugs whose administration represented a very small percentage (500/100,000, 0.50%) or drugs that had not been administered to any patient (as was the case for examide and cytoglipton) were eliminated. <xref ref-type="table" rid="table3">Table 3</xref> lists the drugs selected after data processing and the number and proportions of patients using the drug.</p>
          <p>For each drug, we classified whether it was administered or if there was a change in the dose. We considered four values for this variable: “up” indicates that the dose was increased during the patient encounter, “down” indicates that the dose was decreased, “steady” indicates that the dose did not change, and “no” indicates that the drug was not administered.</p>
          <p>As shown in <xref ref-type="table" rid="table3">Table 3</xref>, insulin was administered to more than 50% of the patients present in our data set, metformin was administered to slightly less than 20% of the patients, followed by glipizide and glyburide. The drugs that were administered to fewer patients were glyburide-metformin and nateglinide.</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Variables discarded from the data set.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="500"/>
              <col width="500"/>
              <thead>
                <tr valign="top">
                  <td>Variable</td>
                  <td>Discard reason</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>encounter_id<sup>a</sup></td>
                  <td>Irrelevant variable for clustering</td>
                </tr>
                <tr valign="top">
                  <td>patient_nbr<sup>b</sup></td>
                  <td>Irrelevant variable for clustering</td>
                </tr>
                <tr valign="top">
                  <td>payer_code<sup>c</sup></td>
                  <td>Irrelevant variable for clustering</td>
                </tr>
                <tr valign="top">
                  <td>Weight</td>
                  <td>Data missing for 97.00% (n=97,000) of the 100,000 samples</td>
                </tr>
                <tr valign="top">
                  <td>Medical specialty</td>
                  <td>Data missing for 53.00% (n=53,000) of the 100,000 samples</td>
                </tr>
                <tr valign="top">
                  <td>Clorpropamida</td>
                  <td>Only 86 patients use this drug</td>
                </tr>
                <tr valign="top">
                  <td>Acarbosa</td>
                  <td>Only 308 patients use this drug</td>
                </tr>
                <tr valign="top">
                  <td>Miglitol</td>
                  <td>Only 38 patients use this drug</td>
                </tr>
                <tr valign="top">
                  <td>Troglitazona</td>
                  <td>Only 3 patients use this drug</td>
                </tr>
                <tr valign="top">
                  <td>Examide</td>
                  <td>No patient uses this drug</td>
                </tr>
                <tr valign="top">
                  <td>Citoglipton</td>
                  <td>No patient uses this drug</td>
                </tr>
                <tr valign="top">
                  <td>Glipizide_metformin</td>
                  <td>Only 13 patients use this drug</td>
                </tr>
                <tr valign="top">
                  <td>Glimepirida_pioglitazona</td>
                  <td>Only 1 patient uses this drug</td>
                </tr>
                <tr valign="top">
                  <td>Metformin_rosiglitazone</td>
                  <td>Only 2 patients use this drug</td>
                </tr>
                <tr valign="top">
                  <td>Metformina_pioglitazona</td>
                  <td>Only 1 patient uses this drug</td>
                </tr>
                <tr valign="top">
                  <td>Acetohexamida</td>
                  <td>Only 1 patient uses this drug</td>
                </tr>
                <tr valign="top">
                  <td>Tolbutamide</td>
                  <td>Only 23 patients use this drug</td>
                </tr>
                <tr valign="top">
                  <td>Tolazamide</td>
                  <td>Only 39 patients use this drug</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table1fn1">
                <p><sup>a</sup>encounter_id: Identification of a specific hospital visit or patient encounter.</p>
              </fn>
              <fn id="table1fn2">
                <p><sup>b</sup>patient_nbr: patient ID number.</p>
              </fn>
              <fn id="table1fn3">
                <p><sup>c</sup>payer_code: identifier corresponding to 23 distinct values of payment method (eg, Blue Cross<italic>/</italic>Blue Shield, Medicare, patient payment).</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Patient characteristics, description, and their corresponding values.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="300"/>
              <col width="500"/>
              <col width="200"/>
              <thead>
                <tr valign="top">
                  <td>Variable</td>
                  <td>Description</td>
                  <td>Values</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Gender</td>
                  <td>Patient gender (self-identified)</td>
                  <td>0, 1</td>
                </tr>
                <tr valign="top">
                  <td>Age</td>
                  <td>Patient age (years)</td>
                  <td>5, 15, 25, 35, 45,…95</td>
                </tr>
                <tr valign="top">
                  <td>admission_type_id</td>
                  <td>Identifier corresponding to 8 different types of admissions: emergencies, accidents, newborns, and others</td>
                  <td>1-8</td>
                </tr>
                <tr valign="top">
                  <td>discharge_disposition_id</td>
                  <td>Identifier of the discharge type (eg, discharged to home, psychiatric hospital, medical facility)</td>
                  <td>1-28</td>
                </tr>
                <tr valign="top">
                  <td>admission_source_id</td>
                  <td>Identifier of the admission source (eg, transfer from hospice, transfer from an ambulatory surgery center)</td>
                  <td>1-11, 13-14, 20, 22, 25</td>
                </tr>
                <tr valign="top">
                  <td>time_in_hospital</td>
                  <td>Number of days between admission and discharge</td>
                  <td>1-14</td>
                </tr>
                <tr valign="top">
                  <td>num_lab_procedures</td>
                  <td>Number of laboratory tests performed during the encounter</td>
                  <td>1-132</td>
                </tr>
                <tr valign="top">
                  <td>num_procedures</td>
                  <td>Number of procedures performed during the encounter</td>
                  <td>0-6</td>
                </tr>
                <tr valign="top">
                  <td>num_medications</td>
                  <td>Number of different drugs (generic names) administered during the encounter</td>
                  <td>1-81</td>
                </tr>
                <tr valign="top">
                  <td>number_outpatient</td>
                  <td>Number of outpatient visits</td>
                  <td>0-42</td>
                </tr>
                <tr valign="top">
                  <td>number_emergency</td>
                  <td>Number of emergency visits</td>
                  <td>0-76</td>
                </tr>
                <tr valign="top">
                  <td>number_inpatient</td>
                  <td>Number of inpatient visits</td>
                  <td>0-21</td>
                </tr>
                <tr valign="top">
                  <td>number_diagnoses</td>
                  <td>Number of diagnoses</td>
                  <td>1-16</td>
                </tr>
                <tr valign="top">
                  <td>max_glu_serum</td>
                  <td>Range of the result of the serum glucose level or if the test was not performed</td>
                  <td>0, 1</td>
                </tr>
                <tr valign="top">
                  <td>a1cresult</td>
                  <td>Range of the result of the hemoglobin A1C level or if the test was not performed</td>
                  <td>0, 1</td>
                </tr>
                <tr valign="top">
                  <td>change</td>
                  <td>If there is a change in medication</td>
                  <td>0, 1</td>
                </tr>
                <tr valign="top">
                  <td>diabetesmed</td>
                  <td>If the patient has been prescribed medication for diabetes</td>
                  <td>0, 1</td>
                </tr>
                <tr valign="top">
                  <td>readmitted</td>
                  <td>Days to inpatient readmission; these categories will be relabeled</td>
                  <td>0, 1, 2</td>
                </tr>
                <tr valign="top">
                  <td>African American, Asian, Caucasian, Hispanic, Other</td>
                  <td>Patient’s race</td>
                  <td>0, 1</td>
                </tr>
                <tr valign="top">
                  <td>circulatory</td>
                  <td>If the patient is admitted with circulatory system problems, the variable takes the value of 1</td>
                  <td>0, 1</td>
                </tr>
                <tr valign="top">
                  <td>diabetes</td>
                  <td>If the patient is admitted with diabetes-related problems, the variable takes the value of 1</td>
                  <td>0, 1</td>
                </tr>
                <tr valign="top">
                  <td>digestive</td>
                  <td>If the patient is admitted with digestive system problems, the variable takes the value of 1</td>
                  <td>0, 1</td>
                </tr>
                <tr valign="top">
                  <td>genitourinary</td>
                  <td>If the patient is admitted with genitourinary problems, the variable takes the value of 1</td>
                  <td>0, 1</td>
                </tr>
                <tr valign="top">
                  <td>injury</td>
                  <td>If the patient is admitted with injuries, the variable takes the value of 1</td>
                  <td>0, 1</td>
                </tr>
                <tr valign="top">
                  <td>musculoskeletal</td>
                  <td>If the patient is admitted with musculoskeletal problems, the variable takes the value of 1</td>
                  <td>0, 1</td>
                </tr>
                <tr valign="top">
                  <td>neoplasms</td>
                  <td>If the patient is admitted with neoplasms, the variable takes the value of 1</td>
                  <td>0, 1</td>
                </tr>
                <tr valign="top">
                  <td>respiratory</td>
                  <td>If the patient is admitted with respiratory system problems, the variable takes the value of 1</td>
                  <td>0, 1</td>
                </tr>
                <tr valign="top">
                  <td>other2</td>
                  <td>If the patient is admitted with other complications, the variable takes the value of 1</td>
                  <td>0, 1</td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
          <table-wrap position="float" id="table3">
            <label>Table 3</label>
            <caption>
              <p>Final drugs used in the data set among 24 total drugs (N=100,000 patients).<sup>a</sup></p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="500"/>
              <col width="500"/>
              <thead>
                <tr valign="top">
                  <td>Drug</td>
                  <td>Patients, n (%)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Insulin</td>
                  <td>54,383 (53.44)</td>
                </tr>
                <tr valign="top">
                  <td>Metformin</td>
                  <td>19,988 (19.99)</td>
                </tr>
                <tr valign="top">
                  <td>Glipizide</td>
                  <td>12,686 (12.69)</td>
                </tr>
                <tr valign="top">
                  <td>Glyburide</td>
                  <td>10,650 (10.65)</td>
                </tr>
                <tr valign="top">
                  <td>Pioglitazone</td>
                  <td>7328 (7.33)</td>
                </tr>
                <tr valign="top">
                  <td>Rosiglitazone</td>
                  <td>6365 (6.37)</td>
                </tr>
                <tr valign="top">
                  <td>Glimepiride</td>
                  <td>5191 (5.19)</td>
                </tr>
                <tr valign="top">
                  <td>Repaglinide</td>
                  <td>1539 (1.54)</td>
                </tr>
                <tr valign="top">
                  <td>Glyburide-metformin</td>
                  <td>706 (0.71)</td>
                </tr>
                <tr valign="top">
                  <td>Nateglinide</td>
                  <td>703 (0.70)</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table3fn1">
                <p><sup>a</sup>Some patients were administered more than one drug.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
      </sec>
      <sec>
        <title>Clustering-Based Recommendation</title>
        <sec>
          <title>General Approach</title>
          <p>The proposed RS is based on the collaborative filtering approach to represent the drugs prescribed to each patient according to the dose given. The clustering technique was applied to group patients with similar characteristics.</p>
          <p><xref rid="figure2" ref-type="fig">Figure 2</xref> shows a schematic of our proposed method, where the relationship between the elements of the system can be appreciated. The patient’s information is first obtained from the data set, such as clinical history, treatments, and the medication prescribed, and then the data are further processed for the application of clustering algorithms. The collaborative filtering technique is then applied to represent the patient’s explicit data (user-medication-dose). According to the group to which the patient belongs, the prediction of the medications is made. Finally, the recommendation is made considering the drugs with the highest prediction value.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Schematic of the proposed recommendation approach.</p>
            </caption>
            <graphic xlink:href="jmir_v24i7e37233_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Patient Grouping</title>
          <p>To obtain the patient groups, we tested two clustering algorithms to determine the algorithm that provides the best result: the partitional K-means algorithm and the density-based spatial clustering of applications with noise (DBSCAN) algorithm. For this process, it was first necessary to normalize the data and reduce the dimensionality of the data set using principal component analysis (PCA). The optimal number of clusters was determined using the Silhouette coefficient. Patients sharing the same characteristics will be part of the same cluster.</p>
          <p>The results of both clustering algorithms were compared using the value of the Silhouette coefficient obtained.</p>
        </sec>
        <sec>
          <title>Drug Prediction</title>
          <p>For calculation of the prediction performance, we randomly divided the data set into two parts: 80.00% (4142/5177) for training the algorithm and the remaining 20.00% (1035/5177) for testing.</p>
          <p>The collaborative filtering approach requires users, items, and ratings; in our case, these elements were replaced by patients, drugs, and drug dosage, respectively, where a value of 1 means that the patient’s drug dosage was decreased and a value of 2 means that the drug dosage was increased. With these elements, we proceeded to the construction of the collaborative filtering matrix, as shown in <xref ref-type="table" rid="table4">Table 4</xref>.</p>
          <p>The matrix was completed with the prediction of the drug dose value for the patients in each cluster, which was calculated by applying the cosine similarity measure for each of the clusters.</p>
          <table-wrap position="float" id="table4">
            <label>Table 4</label>
            <caption>
              <p>Collaborative filtering matrix.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="250"/>
              <col width="150"/>
              <col width="150"/>
              <col width="150"/>
              <col width="150"/>
              <col width="150"/>
              <thead>
                <tr valign="top">
                  <td/>
                  <td>Medication 1</td>
                  <td>Medication 2</td>
                  <td>Medication 3</td>
                  <td>Medication 4</td>
                  <td>Cluster</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Patient 1</td>
                  <td>1</td>
                  <td>0</td>
                  <td>2</td>
                  <td>1</td>
                  <td>1</td>
                </tr>
                <tr valign="top">
                  <td>Patient 2</td>
                  <td>0</td>
                  <td>1</td>
                  <td>1</td>
                  <td>1</td>
                  <td>2</td>
                </tr>
                <tr valign="top">
                  <td>Patient 3</td>
                  <td>2</td>
                  <td>0</td>
                  <td>0</td>
                  <td>1</td>
                  <td>1</td>
                </tr>
                <tr valign="top">
                  <td>Patient 4</td>
                  <td>1</td>
                  <td>2</td>
                  <td>0</td>
                  <td>0</td>
                  <td>3</td>
                </tr>
                <tr valign="top">
                  <td>Patient 5</td>
                  <td>1</td>
                  <td>1</td>
                  <td>2</td>
                  <td>0</td>
                  <td>2</td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overall Clustering Results</title>
        <p>First, PCA was used to reduce the dimensionality of the data set, resulting in 8 components explaining most of the variance of our data (ie, these components explained 62% of the total variance). We then applied the two clustering algorithms with the 8 principal components. <xref ref-type="table" rid="table5">Table 5</xref> shows the best results of the experimentation with the K-means and DBSCAN algorithms.</p>
        <p>In comparison with DBSCAN, the K-means algorithm had a higher Silhouette coefficient and a much lower number of clusters for the same data set. Moreover, K-means had a much faster execution time, which means that this algorithm presents lower computational complexity in terms of execution compared with that of DBSCAN. Therefore, the clustering results obtained with K-means were further considered for the calculation of prediction and recommendations. Analysis of the clusters was performed considering the clustering obtained with the K-means algorithm, which showed the best results.</p>
        <p>Cluster 4 had the highest number of patients, followed by clusters 2 and 6. Cluster 3 had the smallest number of patients due to the different characteristics considered to group similar patients, such as the diagnosed diseases, race, main drugs administered, and most representative age range.</p>
        <p><xref rid="figure3" ref-type="fig">Figure 3</xref> provides details about the six clusters, including the variables analyzed, such as age, gender, race, health problems, medications, and information about the doses of insulin administered to the patient.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Comparative analysis of the performance of the algorithms.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td>Algorithm</td>
                <td>Number of clusters</td>
                <td>Silhouette coefficient</td>
                <td>Execution time</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>K-means</td>
                <td>6</td>
                <td>0.654</td>
                <td>15 minutes, 24 seconds</td>
              </tr>
              <tr valign="top">
                <td>DBSCAN<sup>a</sup></td>
                <td>200</td>
                <td>0.611</td>
                <td>20 minutes, 31 seconds</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>DBSCAN: density-based spatial clustering of applications with noise.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Details about the six clusters.</p>
          </caption>
          <graphic xlink:href="jmir_v24i7e37233_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Characteristics of Clusters</title>
        <sec>
          <title>Cluster 1</title>
          <p>Cluster 1 (n=875) included patients who were administered most of the drugs shown in <xref ref-type="table" rid="table3">Table 3</xref>. In this cluster, 60.6% (n=530) of the patients were female and the remaining 39.4% (n=345) were male. All patients in this group were of African American race. These patients suffered from health problems in the circulatory and respiratory systems directly related to diabetes. The most representative age range in this group was 45-75 years.</p>
        </sec>
        <sec>
          <title>Cluster 2</title>
          <p>Cluster 2 (n=910) was characterized by a homogeneous distribution of male and female patients; the main diseases diagnosed for these patients involved the respiratory system. Almost all of the patients in this group (n=867, 95.3%) were Caucasian. The main drugs administered for this group were metformin, glipizide, and glyburide, and the dosages were often changed (increased and decreased). Another relevant characteristic of this cluster is that the patients had not been administered insulin. The most representative age range of patients in this group was 55-85 years.</p>
        </sec>
        <sec>
          <title>Cluster 3</title>
          <p>In cluster 3 (n=412), the main drugs administered to patients were glyburide, metformin, and glipizide, whereas insulin had also not been administered to this group. There was diversity in the age range of the patients within this cluster, with the most representative range being 55-85 years. The patients in this cluster also tended to be diagnosed with other diseases such as metabolic disease and diseases of the nervous system. All of these patients belonged to the Caucasian race.</p>
        </sec>
        <sec>
          <title>Cluster 4</title>
          <p>The patients in cluster 4 (n=1369) were mainly administered insulin, metformin, and glipizide; although patients in this group were prescribed other drugs, their proportions were relatively lower. The main diseases diagnosed in this group of patients were diseases of the circulatory and respiratory systems. This cluster grouped the largest number of patients analyzed and the predominant age range was 55-85 years.</p>
        </sec>
        <sec>
          <title>Cluster 5</title>
          <p>Cluster 5 (n=646) was largely characterized by patients in this group having received more treatments with the following drugs: glyburide, glipizide, and metformin. Insulin had not been administered to this group, and all patients were diagnosed with diseases related to the circulatory system. The most prominent age range was 55-75 years.</p>
        </sec>
        <sec>
          <title>Cluster 6</title>
          <p>In cluster 6 (n=965), patients were mainly administered the following drugs: insulin, metformin, glipizide, and glyburide. The main diseases diagnosed in this group of patients were those of the circulatory system and diseases related to diabetes mellitus, among others. The predominant age range was 45-75 years.</p>
        </sec>
      </sec>
      <sec>
        <title>Quality of Predictions</title>
        <p>To evaluate the quality of the predictions, we used the mean squared error (MSE), which penalizes more severely when the error is higher [<xref ref-type="bibr" rid="ref20">20</xref>]. A significant MSE value of 0.53 was obtained in the test set, which means that the system is capable of obtaining good predictions. As a measure of error, a lower the error value indicates a more efficient RS [<xref ref-type="bibr" rid="ref21">21</xref>].</p>
      </sec>
      <sec>
        <title>Quality of Recommendations</title>
        <p>The quality metric is fundamental to measuring the performance of our RS, since it provides information on the proportion of recommended drugs that are relevant for the user. In our case, a drug is considered relevant when the value of the dose is greater than 1. In the experiments, a precision value of 0.61 was obtained, which indicated that the system provides acceptable recommendations.</p>
      </sec>
      <sec>
        <title>Generation of Recommendations</title>
        <p>Considering a patient “p” with diabetes who belongs to cluster “c,” a list of drugs {f<sub>1</sub>,f<sub>2</sub>,...f<sub>n</sub>} with the highest prediction score is recommended by the system. An example of the recommendation for two patients in cluster 1 is presented in <xref ref-type="table" rid="table6">Table 6</xref> based on a setting of providing the top 3 recommendations.</p>
        <p><xref ref-type="table" rid="table6">Table 6</xref> shows that the recommended medications were similar for both patients in cluster 1; however, the order of recommendation varied according to the prediction score obtained for each medication. This is to be expected since these two patients share similar characteristics in terms of clinical information, personal data, and medical treatments stored in the data set.</p>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Drug recommendation for two patients with diabetes in cluster 1.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="400"/>
            <col width="600"/>
            <thead>
              <tr valign="top">
                <td>Patient ID</td>
                <td>Drugs recommended<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>36</td>
                <td>Insulin, glipizide, metformin</td>
              </tr>
              <tr valign="top">
                <td>15</td>
                <td>Metformin, insulin, glyburide</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>Drugs are listed in order of preference (highest to lowest prediction score).</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Results</title>
        <p>Our analysis of the UCI Machine Learning Repository showed that most patients with diabetes have circulatory and respiratory problems, followed by metabolic and nervous system problems. Regarding gender, women with diabetes showed more circulatory and respiratory health problems compared to men. It was determined that diabetes manifests differently for individual patients. In addition, in the analysis according to race (Caucasian, African American, Hispanic, and Asian), different categories were identified according to patient and clinical characteristics: (1) older patients with circulatory, respiratory, and other problems; (2) younger patients with digestive, respiratory, and other problems; (3) patients requiring increased insulin doses; and (4) patients prescribed more than one type of medication.</p>
        <p>From the data set used, we further observed that diabetes can occur at any age; however, the disease appears to be more common among middle-aged and older people. The analysis showed that the health outcomes related to diabetes are different for each patient, both at the level of control with medication and health complications. Based on these findings, an RS is required to provide support to health care professionals to facilitate the management and control of this chronic disease. Therefore, a cluster-based RS was proposed to help recommend drugs to patients with diabetes. The clustering technique was used to identify groups of patients based on their similar characteristics, and the collaborative filtering technique was used to present information on the doses of the medications administered to patients. Our experimental results showed acceptable performance of the proposed system.</p>
      </sec>
      <sec>
        <title>Limitations and Future Work</title>
        <p>The use of explicit information (ratings) from users enables making more precise recommendations; however, according to Wasid and Ali [<xref ref-type="bibr" rid="ref22">22</xref>], additional effort is required from users when rating an item. Therefore, obtaining useful ratings without additional effort from users is one of the challenges of RSs based on collaborative filtering.</p>
        <p>A typical problem of RSs based on collaborative filtering is that data and ratings are often scarce, resulting in a problem of new user and new item cold start. An alternative solution to overcome this problem is to calculate the similarity of the users based on user profiles [<xref ref-type="bibr" rid="ref13">13</xref>]. For example, if two users are diagnosed with the same disease, they could be considered similar, even if they have not been administered the same drugs during their treatment. Other characteristics such as gender, age, medications administered to the patient, and diseases diagnosed could help classify patients into clusters. Although this study avoided the cold-start (new user) problem by using patient information for clustering and subsequent recommendation, there is a limitation with medications that are entered in the system and have not yet been prescribed to any patient, since the system would have difficulty recommending such medications (ie, new item cold-start problem).</p>
        <p>One solution to this problem is to use the metadata of the new items when making recommendations [<xref ref-type="bibr" rid="ref13">13</xref>]. Combining both user and item information would provide a hybrid approach to address the new user and new item cold-start problem. Therefore, as future work, we propose to (1) extend the recommendation approach using drug information for the prediction and recommendation process, and (2) consider the clustering results of the DBSCAN algorithm for prediction and analyze whether this can improve the quality of recommendations.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>We found some previous studies related to the topic of RSs in the health domain; however, our proposed approach differs from these previous works by focusing on combining collaborative filtering with clustering techniques to avoid the cold-start (new user) problem.</p>
        <p>The experimental results showed that our recommendation approach performs well in terms of offering good predictions and acceptable recommendations considering patient information. In comparison with the study of Sanchez et al [<xref ref-type="bibr" rid="ref13">13</xref>] who recommended educational content about diabetes, our work focuses on recommending medications to patients with diabetes. Galiano and Paccanaro [<xref ref-type="bibr" rid="ref23">23</xref>] used collaborative filtering for the prediction of medication side effects to provide recommendations to safety professionals based on a latent factor model. A latent factor method could also be considered for drug prediction to patients with diabetes, and these results can be compared with those obtained using the clustering-based recommendation approach. Consequently, RSs have been developed based on multiple methods that could be combined with clustering techniques to improve the recommendation process. For example, Chung and Jung [<xref ref-type="bibr" rid="ref24">24</xref>] proposed a knowledge-based cluster model to improve prediction accuracy and make health care recommendations.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>We present an RS that is capable of suggesting medications suitable for patients with diabetes. This system considers user metadata to alleviate the cold-start (new user) problem, obtaining groups of patients with similar characteristics using clustering techniques, which are then used to recommend drugs for patients in the same cluster.</p>
        <p>To measure the performance of the recommender system, the quality of the predictions and recommendations was evaluated. In the case of prediction accuracy, a significant MSE value was obtained and acceptable accuracy was found in the quality of recommendations, which can be further improved by using information from more drugs or combining with another collaborative filtering approach such as an item-based approach.</p>
        <p>The proposed system offers a new method to provide support to health care personnel during the medical care of patients with diabetes by offering recommendations of possible medications that can be considered for the treatment of this disease. In addition, our RS has the advantage of providing recommendations that can be easily explained since the system recommends drugs that have been administered to patients with similar characteristics to the target patient. We believe that this system could be an important tool for health personnel, as it would help to streamline the process of health care and management.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">DBSCAN</term>
          <def>
            <p>density-based spatial clustering of applications with noise</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">MSE</term>
          <def>
            <p>mean squared error</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">PCA</term>
          <def>
            <p>principal component analysis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">RS</term>
          <def>
            <p>recommender system</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">UCI</term>
          <def>
            <p>University of California Irvine</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors would like to thank the Universidad Técnica Particular de Loja for the funding received for the development of this study.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Recommender system application developments: A survey</article-title>
          <source>Decision Support Systems</source>
          <year>2015</year>
          <month>06</month>
          <volume>74</volume>
          <fpage>12</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.1016/j.dss.2015.03.008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>De Choudhury</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Morris</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>RW</given-names>
            </name>
          </person-group>
          <article-title>Seeking and sharing health information online: comparing search engines and social media</article-title>
          <year>2014</year>
          <conf-name>CHI '14- Proceedings of the SIGCHI Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>April 26-May 1, 2014</conf-date>
          <conf-loc>Toronto, ON</conf-loc>
          <publisher-name>Association for Computing Machinery</publisher-name>
          <fpage>1365</fpage>
          <lpage>1376</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/2556288.2557214"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2556288.2557214</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Penson</surname>
              <given-names>DF</given-names>
            </name>
          </person-group>
          <article-title>Internet health resources and the cancer patient</article-title>
          <source>Cancer Invest</source>
          <year>2008</year>
          <month>03</month>
          <volume>26</volume>
          <issue>2</issue>
          <fpage>202</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1080/07357900701566197</pub-id>
          <pub-id pub-id-type="medline">18259953</pub-id>
          <pub-id pub-id-type="pii">785208482</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cheung</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Online Health Information Seeking and eHealth Literacy Among Patients Attending a Primary Care Clinic in Hong Kong: A Cross-Sectional Survey</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>03</month>
          <day>27</day>
          <volume>21</volume>
          <issue>3</issue>
          <fpage>e10831</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/3/e10831/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/10831</pub-id>
          <pub-id pub-id-type="medline">30916666</pub-id>
          <pub-id pub-id-type="pii">v21i3e10831</pub-id>
          <pub-id pub-id-type="pmcid">PMC6456826</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stellefson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shuster</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chaney</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Paige</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Alber</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chaney</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sriram</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Web-based Health Information Seeking and eHealth Literacy among Patients Living with Chronic Obstructive Pulmonary Disease (COPD)</article-title>
          <source>Health Commun</source>
          <year>2018</year>
          <month>12</month>
          <volume>33</volume>
          <issue>12</issue>
          <fpage>1410</fpage>
          <lpage>1424</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28872905"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/10410236.2017.1353868</pub-id>
          <pub-id pub-id-type="medline">28872905</pub-id>
          <pub-id pub-id-type="pmcid">PMC6097958</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>iDoctor: Personalized and professionalized medical recommendations based on hybrid matrix factorization</article-title>
          <source>Future Generation Computer Systems</source>
          <year>2017</year>
          <month>01</month>
          <volume>66</volume>
          <fpage>30</fpage>
          <lpage>35</lpage>
          <pub-id pub-id-type="doi">10.1016/j.future.2015.12.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gujar</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Biyani</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bramhane</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Bhosale</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Vaidya</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Disease prediction and doctor recommendation system</article-title>
          <source>Int Res J Eng Technol</source>
          <year>2018</year>
          <month>03</month>
          <volume>5</volume>
          <issue>3</issue>
          <fpage>3207</fpage>
          <lpage>3209</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.academia.edu/36834941/Disease_Prediction_and_Doctor_Recommendation_System"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kuanr</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mohapatra</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Piri</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Health Recommender System for Cervical Cancer Prognosis in Women</article-title>
          <year>2021</year>
          <conf-name>2021 6th International Conference on Inventive Computation Technologies (ICICT)</conf-name>
          <conf-date>January 20-22, 2021</conf-date>
          <conf-loc>Coimbatore, India</conf-loc>
          <fpage>673</fpage>
          <lpage>679</lpage>
          <pub-id pub-id-type="doi">10.1109/ICICT50816.2021.9358540</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Princy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Senith</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kirubaraj</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Vijaykumar</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>A personalized food recommender system for women considering nutritional information</article-title>
          <source>Int J Pharmaceut Res</source>
          <year>2021</year>
          <month>02</month>
          <day>02</day>
          <volume>13</volume>
          <issue>02</issue>
          <pub-id pub-id-type="doi">10.31838/ijpr/2021.13.02.233</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Narducci</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Musto</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Polignano</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>de Gemmis</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lops</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Semeraro</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>A recommender system for connecting patients to the right doctors in the HealthNet social network</article-title>
          <year>2015</year>
          <conf-name>WWW '15 Companion: Proceedings of the 24th International Conference on World Wide Web</conf-name>
          <conf-date>May 18-22, 2015</conf-date>
          <conf-loc>Florence, Italy</conf-loc>
          <fpage>81</fpage>
          <lpage>82</lpage>
          <pub-id pub-id-type="doi">10.1145/2740908.2742748</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Predicting potential side effects of drugs by recommender methods and ensemble learning</article-title>
          <source>Neurocomputing</source>
          <year>2016</year>
          <month>01</month>
          <volume>173</volume>
          <fpage>979</fpage>
          <lpage>987</lpage>
          <pub-id pub-id-type="doi">10.1016/j.neucom.2015.08.054</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nasiri</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Minaei</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kiani</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Dynamic recommendation: disease prediction and prevention using recommender system</article-title>
          <source>Int J Basic Sci Med</source>
          <year>2016</year>
          <month>06</month>
          <day>29</day>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>13</fpage>
          <lpage>17</lpage>
          <pub-id pub-id-type="doi">10.15171/ijbsm.2016.04</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sanchez Bocanegra</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Sevillano Ramos</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Rizo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Civit</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fernandez-Luque</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>HealthRecSys: a semantic content-based recommender system to complement health videos</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2017</year>
          <month>05</month>
          <day>15</day>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>63</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-017-0431-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-017-0431-7</pub-id>
          <pub-id pub-id-type="medline">28506225</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-017-0431-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC5433022</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bianchini</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>De Antonellis</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>De Franceschi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Melchiori</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>PREFer: a prescription-based food recommender system</article-title>
          <source>Comput Stand Interf</source>
          <year>2017</year>
          <month>11</month>
          <volume>54</volume>
          <fpage>64</fpage>
          <lpage>75</lpage>
          <pub-id pub-id-type="doi">10.1016/j.csi.2016.10.010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Amin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Mokhtari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Abdulrazak</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Aloulou</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>A hybrid framework for a comprehensive physical activity and diet recommendation system</article-title>
          <source>Smart Homes and Health Telematics, Designing a Better Future: Urban Assisted Living. ICOST 2018. Lecture Notes in Computer Science, vol 10898</source>
          <year>2018</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>109</fpage>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nowakowska</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zghebi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ashcroft</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Buchan</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Chew-Graham</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Holt</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mallen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Van Marwijk</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Peek</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Perera-Salazar</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Reeves</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Rutter</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Qureshi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Mamas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kontopantelis</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>The comorbidity burden of type 2 diabetes mellitus: patterns, clusters and predictions from a large English primary care cohort</article-title>
          <source>BMC Med</source>
          <year>2019</year>
          <month>07</month>
          <day>25</day>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>145</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedicine.biomedcentral.com/articles/10.1186/s12916-019-1373-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12916-019-1373-y</pub-id>
          <pub-id pub-id-type="medline">31345214</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12916-019-1373-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC6659216</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>MZ</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Qiao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Clustering patterns of type-type combination in multiple genotypes infections of human papillomavirus in cervical adenocarcinoma</article-title>
          <source>J Med Virol</source>
          <year>2019</year>
          <month>11</month>
          <day>07</day>
          <volume>91</volume>
          <issue>11</issue>
          <fpage>2001</fpage>
          <lpage>2008</lpage>
          <pub-id pub-id-type="doi">10.1002/jmv.25553</pub-id>
          <pub-id pub-id-type="medline">31347710</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dua</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Graff</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <source>UCI Machine Learning Repository</source>
          <year>2019</year>
          <access-date>2022-06-27</access-date>
          <publisher-name>Irvine, CA: University of California, School of Information and Computer Science</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://archive.ics.uci.edu/ml/index.php">https://archive.ics.uci.edu/ml/index.php</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Strack</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>DeShazo</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Gennings</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Olmo</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Ventura</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cios</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Clore</surname>
              <given-names>JN</given-names>
            </name>
          </person-group>
          <article-title>Impact of HbA1c measurement on hospital readmission rates: analysis of 70,000 clinical database patient records</article-title>
          <source>Biomed Res Int</source>
          <year>2014</year>
          <volume>2014</volume>
          <fpage>781670</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.hindawi.com/journals/bmri/2014/781670/">https://www.hindawi.com/journals/bmri/2014/781670/</ext-link>
          </comment>
          <pub-id pub-id-type="doi">10.1155/2014/781670</pub-id>
          <pub-id pub-id-type="medline">24804245</pub-id>
          <pub-id pub-id-type="pmcid">PMC3996476</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Performance Evaluation of Recommender Systems</article-title>
          <source>Int J Performability Eng</source>
          <year>2017</year>
          <volume>13</volume>
          <issue>8</issue>
          <fpage>1246</fpage>
          <lpage>1256</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://paris.utdallas.edu/IJPE/Vol13/Issue08/IJPE-2017-08-07.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.23940/ijpe.17.08.p7.12461256</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Rating prediction of recommended item based on review deep learning and rating probability matrix factorization</article-title>
          <source>Electronic Commerce Research and Applications</source>
          <year>2022</year>
          <month>5</month>
          <day>09</day>
          <fpage>101160</fpage>
          <pub-id pub-id-type="doi">10.1016/j.elerap.2022.101160</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wasid</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>An improved recommender system based on multi-criteria clustering approach</article-title>
          <source>Procedia Comput Sci</source>
          <year>2018</year>
          <volume>131</volume>
          <fpage>93</fpage>
          <lpage>101</lpage>
          <pub-id pub-id-type="doi">10.1016/j.procs.2018.04.190</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Galeano</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Paccanaro</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A recommender system approach for predicting drug side effects</article-title>
          <year>2018</year>
          <conf-name>2018 International Joint Conference on Neural Networks (IJCNN)</conf-name>
          <conf-date>July 8-23, 2018</conf-date>
          <conf-loc>Rio de Janeiro, Brazil</conf-loc>
          <pub-id pub-id-type="doi">10.1109/ijcnn.2018.8489025</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Knowledge-based dynamic cluster model for healthcare management using a convolutional neural network</article-title>
          <source>Inf Technol Manag</source>
          <year>2019</year>
          <month>08</month>
          <day>12</day>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>41</fpage>
          <lpage>50</lpage>
          <pub-id pub-id-type="doi">10.1007/s10799-019-00304-1</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
