<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
    <article-id pub-id-type="publisher-id">v20i9e263</article-id>
    <article-id pub-id-type="pmid">30249589</article-id>
    <article-id pub-id-type="doi">10.2196/jmir.9227</article-id>
    <article-categories>
      <subj-group subj-group-type="heading">
        <subject>Original Paper</subject>
      </subj-group>
      <subj-group subj-group-type="article-type">
        <subject>Original Paper</subject>
      </subj-group>
    </article-categories>
    <title-group>
      <article-title>Improving Prediction of Risk of Hospital Admission in Chronic Obstructive Pulmonary Disease: Application of Machine Learning to Telemonitoring Data</article-title>
    </title-group>
    <contrib-group>
      <contrib contrib-type="editor">
        <name>
          <surname>Eysenbach</surname>
          <given-names>Gunther</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Velardo</surname>
          <given-names>Carmelo</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Limsopatham</surname>
          <given-names>Nut</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Wang</surname>
          <given-names>Yanshan</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="author" id="contrib1">
        <name name-style="western">
          <surname>Orchard</surname>
          <given-names>Peter</given-names>
        </name>
        <degrees>MSci, MSc, PhD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-1330-9528</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib2">
        <name name-style="western">
          <surname>Agakova</surname>
          <given-names>Anna</given-names>
        </name>
        <degrees>MSc, MEng</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3722-0843</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib3">
        <name name-style="western">
          <surname>Pinnock</surname>
          <given-names>Hilary</given-names>
        </name>
        <degrees>MBChB, MD, MRCGP</degrees>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-5976-8386</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib4">
        <name name-style="western">
          <surname>Burton</surname>
          <given-names>Christopher David</given-names>
        </name>
        <degrees>MBChB, MD, FRCGP</degrees>
        <xref rid="aff3" ref-type="aff">3</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-0233-2431</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib5">
        <name name-style="western">
          <surname>Sarran</surname>
          <given-names>Christophe</given-names>
        </name>
        <degrees>MPhys, PhD</degrees>
        <xref rid="aff4" ref-type="aff">4</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-0605-8839</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib6">
        <name name-style="western">
          <surname>Agakov</surname>
          <given-names>Felix</given-names>
        </name>
        <degrees>MSc, PhD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-4280-9062</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib7" corresp="yes">
      <name name-style="western">
        <surname>McKinstry</surname>
        <given-names>Brian</given-names>
      </name>
      <degrees>MBChB, MD, FRCP(Edin), FRCGP, FFCI</degrees>
      <xref rid="aff2" ref-type="aff">2</xref>
      <address>
        <institution>Usher Institute of Population Health Sciences and Informatics</institution>
        <institution>University of Edinburgh</institution>
        <addr-line>Number Nine Bioquarter</addr-line>
        <addr-line>9 Little France Road</addr-line>
        <addr-line>Edinburgh, EH16 4UX</addr-line>
        <country>United Kingdom</country>
        <phone>44 1316502378</phone>
        <email>brian.mckinstry@ed.ac.uk</email>
      </address>  
      <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-9581-0468</ext-link></contrib>
    </contrib-group>
    <aff id="aff1">
      <label>1</label>
      <institution>Pharmatics</institution>
      <addr-line>Edinburgh</addr-line>
      <country>United Kingdom</country>
    </aff>
    <aff id="aff2">
    <label>2</label>
    <institution>Usher Institute of Population Health Sciences and Informatics</institution>
    <institution>University of Edinburgh</institution>  
    <addr-line>Edinburgh</addr-line>
    <country>United Kingdom</country></aff>
    <aff id="aff3">
    <label>3</label>
    <institution>Academic Unit of Primary Medical Care</institution>
    <institution>University of Sheffield</institution>  
    <addr-line>Sheffield</addr-line>
    <country>United Kingdom</country></aff>
    <aff id="aff4">
      <label>4</label>
      <institution>Met Office</institution>
      <addr-line>Exeter</addr-line>
      <country>United Kingdom</country>
    </aff>
    <author-notes>
      <corresp>Corresponding Author: Brian McKinstry 
      <email>brian.mckinstry@ed.ac.uk</email></corresp>
    </author-notes>
    <pub-date pub-type="collection">
      <month>9</month>
      <year>2018</year>
    </pub-date>
    <pub-date pub-type="epub">
      <day>21</day>
      <month>9</month>
      <year>2018</year>
    </pub-date>
    <volume>20</volume>
    <issue>9</issue>
    <elocation-id>e263</elocation-id>
    <!--history from ojs - api-xml-->
    <history>
      <date date-type="received">
        <day>30</day>
        <month>10</month>
        <year>2017</year>
      </date>
      <date date-type="rev-request">
        <day>19</day>
        <month>2</month>
        <year>2018</year>
      </date>
      <date date-type="rev-recd">
        <day>19</day>
        <month>4</month>
        <year>2018</year>
      </date>
      <date date-type="accepted">
        <day>18</day>
        <month>6</month>
        <year>2018</year>
      </date>
    </history>
    <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
    <copyright-statement>©Peter Orchard, Anna Agakova, Hilary Pinnock, Christopher David Burton, Christophe Sarran, Felix Agakov, Brian McKinstry. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 21.09.2018.</copyright-statement>
    <copyright-year>2018</copyright-year>
    <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
      <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
    </license>  
    <self-uri xlink:href="http://www.jmir.org/2018/9/e263/" xlink:type="simple"/>
    <abstract>
      <sec sec-type="Background">
        <title>Background</title>
        <p>Telemonitoring of symptoms and physiological signs has been suggested as a means of early detection of chronic obstructive pulmonary disease (COPD) exacerbations, with a view to instituting timely treatment. However, algorithms to identify exacerbations result in frequent false-positive results and increased workload. Machine learning, when applied to predictive modelling, can determine patterns of risk factors useful for improving prediction quality.</p>
      </sec>
      <sec sec-type="Objective">
        <title>Objective</title>
        <p>Our objectives were to (1) establish whether machine learning techniques applied to telemonitoring datasets improve prediction of hospital admissions and decisions to start corticosteroids, and (2) determine whether the addition of weather data further improves such predictions.</p>
      </sec>
      <sec sec-type="Methods">
        <title>Methods</title>
        <p>We used daily symptoms, physiological measures, and medication data, with baseline demography, COPD severity, quality of life, and hospital admissions from a pilot and large randomized controlled trial of telemonitoring in COPD. We linked weather data from the United Kingdom meteorological service. We used feature selection and extraction techniques for time series to construct up to 153 predictive patterns (features) from symptom, medication, and physiological measurements. We used the resulting variables to construct predictive models fitted to training sets of patients and compared them with common symptom-counting algorithms.</p>
      </sec>
      <sec sec-type="Results">
        <title>Results</title>
        <p>We had a mean 363 days of telemonitoring data from 135 patients. The two most practical traditional score-counting algorithms, restricted to cases with complete data, resulted in area under the receiver operating characteristic curve (AUC) estimates of 0.60 (95% CI 0.51-0.69) and 0.58 (95% CI 0.50-0.67) for predicting admissions based on a single day’s readings. However, in a real-world scenario allowing for missing data, with greater numbers of patient daily data and hospitalizations (N=57,150, N<sup>+</sup>=55, respectively), the performance of all the traditional algorithms fell, including those based on 2 days’ data. One of the most frequently used algorithms performed no better than chance. All considered machine learning models demonstrated significant improvements; the best machine learning algorithm based on 57,150 episodes resulted in an aggregated AUC of 0.74 (95% CI 0.67-0.80). Adding weather data measurements did not improve the predictive performance of the best model (AUC 0.74, 95% CI 0.69-0.79). To achieve an 80% true-positive rate (sensitivity), the traditional algorithms were associated with an 80% false-positive rate: our algorithm halved this rate to approximately 40% (specificity approximately 60%). The machine learning algorithm was moderately superior to the best symptom-counting algorithm (AUC 0.77, 95% CI 0.74-0.79 vs AUC 0.66, 95% CI 0.63-0.68) at predicting the need for corticosteroids.</p>
      </sec>
      <sec sec-type="Conclusions">
        <title>Conclusions</title>
        <p>Early detection and management of COPD remains an important goal given its huge personal and economic costs. Machine learning approaches, which can be tailored to an individual’s baseline profile and can learn from experience of the individual patient, are superior to existing predictive algorithms and show promise in achieving this goal.</p>
      </sec>
      <sec sec-type="Trial Registration">
        <title>Trial Registration</title>
        <p>International Standard Randomized Controlled Trial Number ISRCTN96634935; http://www.isrctn.com/ISRCTN96634935 (Archived by WebCite at http://www.webcitation.org/722YkuhAz)</p>
      </sec>
    </abstract>
    <kwd-group>
      <kwd>machine learning</kwd>
      <kwd>telemedicine</kwd>
      <kwd>chronic obstructive pulmonary disease</kwd>
    </kwd-group></article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Exacerbations of chronic obstructive pulmonary disease (COPD) are a major cause of acute hospitalizations. Prompt intervention with antibiotics and corticosteroids may prevent admissions and improve quality of life [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>], but difficulties in recognizing early symptoms of deterioration [<xref ref-type="bibr" rid="ref3">3</xref>] often result in delays in accessing care [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref4">4</xref>] and starting treatment. Telemonitoring of symptoms and physiological measurements has been advocated to facilitate early identification and treatment of exacerbations. However, despite patients’ perceptions [<xref ref-type="bibr" rid="ref4">4</xref>], the evidence from randomized controlled trials that telehealth prevents admissions is less than convincing [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. One reason for this is that, far from clarifying the early detection of exacerbations, previously employed algorithms (typically based on international definitions of exacerbations [<xref ref-type="bibr" rid="ref10">10</xref>]) generate frequent, clinically unnecessary alerts [<xref ref-type="bibr" rid="ref11">11</xref>].</p>
        <p>New symptom-based algorithms have been designed to improve identification and assessment of established exacerbations [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. There is some evidence that a composite measure combining oxygen saturation and heart rate with symptoms may predict deteriorations requiring treatment with antibiotics or corticosteroids [<xref ref-type="bibr" rid="ref14">14</xref>], although these physiological measures have marked day-to-day variation, which may obscure subtle changes due to early exacerbations in individual patients [<xref ref-type="bibr" rid="ref15">15</xref>]. The optimal algorithm is thus not yet clear.</p>
        <p>Recently, there have been major advances in developing computational and statistical methods for analyzing noisy, incomplete data, broadly described as machine learning and data mining [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. When applied to predictive modelling, such methods can determine patterns of risk factors useful for improving the quality of predictions. This is in contrast to conventional algorithms, which typically use a small number of established risk factors. However, these techniques are not yet in use for predicting hospital admissions for COPD in patients undergoing telemonitoring.</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>Data from the Telescot COPD telemonitoring program [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref11">11</xref>] included daily symptom and physiological measures, which could be linked with health care use (consultations, prescription of medication, and hospital admission); baseline data on age, severity of COPD, comorbidity, and anxiety and depression scores; and contextual data (such as weather conditions from the Met Office (the United Kingdom [UK] meteorological service) [<xref ref-type="bibr" rid="ref18">18</xref>]. Using machine learning and high-dimensional data mining, we aimed to use this large dataset to identify patterns predictive of hospital admissions or decisions to start corticosteroids.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <p>The Telescot COPD trial (ISRCTN 96634935) [<xref ref-type="bibr" rid="ref11">11</xref>] was undertaken in 2009-2011 preceded by a pilot study [<xref ref-type="bibr" rid="ref4">4</xref>] in 2008 in Lothian, Scotland. Ethical approval was granted by the Lothian research ethics committee (reference 08/S1101/60), with UK National Health Service (NHS) management approval from NHS Lothian, Scotland.</p>
      <sec>
        <title>Datasets and Handling</title>
        <p>The telemonitoring database of day-to-day symptoms and physiological measures from the Telescot COPD trial [<xref ref-type="bibr" rid="ref11">11</xref>] and pilot study [<xref ref-type="bibr" rid="ref4">4</xref>] was held by the NHS. These were linked in the Lothian safe haven with trial data held by the research team and hospital admission data. Datasets were deidentified before analysis.</p>
        <sec>
          <title>The Telemonitoring Dataset</title>
          <p>The Telescot COPD program [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref11">11</xref>] included 146 patients who had moderate to severe COPD (forced expiratory volume in the first second of expiration [FEV<sub>1</sub>] and forced vital capacity both &#60;70%) and at least one admission to hospital in the previous year for an exacerbation of COPD. They recorded data with some gaps over an average of 16 months. Patients were asked to provide daily symptoms and physiological readings (pulse and oxygen saturation, and a subset of the study population also provided spirometry data on a less regular basis) and to record antibiotic and corticosteroid use. The symptom score was based on the presence of major symptoms (scored 2) or minor symptoms (scored 1) based on the work of Anthonisen et al [<xref ref-type="bibr" rid="ref19">19</xref>] and others [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref15">15</xref>] (see <xref ref-type="boxed-text" rid="box1">Textbox 1</xref>). Data were checked daily by a respiratory professional or trained telehealth monitor, and patients were contacted if their symptom score rose above 5. Acceptable ranges for pulse rate and oxygen saturation were set individually, and patients were contacted if readings fell beyond these ranges.</p>
          <boxed-text id="box1" position="float">
            <title>Definitions of chronic obstructive pulmonary disease exacerbation onsets on day 
            <italic>t</italic> used as predictors of hospital admissions on day 
            <italic>t</italic>+1. Note that the last 3 definitions cannot be used for this evaluation unless an early detection can be made, as they detect an onset of an exacerbation with a 1-day delay. For these definitions, we report an approximate upper bound on the predictive performance under the assumption that the exacerbations can be detected.</title>
            <p><list list-type="order"><list-item><p><bold>Major symptoms</bold><list list-type="alpha-lower"><list-item><p>Breathlessness, sputum color, and sputum amount.</p></list-item></list></p></list-item><list-item><p><bold>Minor symptoms</bold><list list-type="alpha-lower"><list-item><p>Cold, wheeze, sore throat, cough, and fever.</p></list-item></list></p></list-item><list-item><p><bold>Symptom counts</bold><list list-type="alpha-lower"><list-item><p>nMajor = number of major symptoms present on day <italic>t</italic>,</p></list-item><list-item><p>nMinor = number of minor symptoms present on day <italic>t</italic>,</p></list-item><list-item><p>nAll = nMajor + nMinor.</p></list-item></list></p></list-item><list-item><p><bold>Definitions</bold><list list-type="alpha-lower"><list-item><p>Definition 1 (after Anthonisen et al. [<xref ref-type="bibr" rid="ref19">19</xref>]): nMajor≥2.</p></list-item><list-item><p>Definition 2 (modification of Rodriguez-Roisin [<xref ref-type="bibr" rid="ref10">10</xref>]): nAll≥5.</p></list-item><list-item><p>Definition 3 (modification of Exacerbation 1 as in Seemungal et al. <xref ref-type="bibr" rid="ref2">2</xref>]): define a 'bad day' as one where (nMajor≥2) or ([nMajor=1] and [nMinor≥1]). An exacerbation is said to occur on day <italic>t</italic> if days <italic>t</italic> and <italic>t</italic> +1 are bad, but days <italic>t</italic> –1 and <italic>t</italic> –2 are not bad.</p></list-item><list-item><p>Definition 4 (modification of Seemungal et al. <xref ref-type="bibr" rid="ref2">2</xref>] as in Burton et al. <xref ref-type="bibr" rid="ref15">15</xref>): Like Definition 3, but a bad day is defined as one where (nMajor≥1) and (nAll≥3).</p></list-item><list-item><p>Definition 5 (after Pinnock et al. <xref ref-type="bibr" rid="ref11">11</xref>): An exacerbation is said to occur on day <italic>t</italic> if: <list list-type="roman-lower"><list-item><p>(nAll≥5) on day <italic>t</italic>, or</p></list-item><list-item><p>(nAll=4) on day <italic>t</italic> and (nAll≥4) on day <italic>t</italic> +1.</p></list-item></list></p></list-item></list></p></list-item></list></p>
          </boxed-text>
        </sec>
        <sec>
          <title>Trial Data</title>
          <p>Baseline trial data on demographic characteristics, body mass index, spirometry, Medical Research Council Dyspnoea Scale [<xref ref-type="bibr" rid="ref20">20</xref>], Hospital Anxiety and Depression Scale [<xref ref-type="bibr" rid="ref21">21</xref>], St George’s Respiratory Questionnaire [<xref ref-type="bibr" rid="ref22">22</xref>], previous hospital admissions, and comorbidity were also available. At the end of the trial, we searched hospital records for admissions during the trial, and 2 clinicians determined whether the admission was due to COPD, partly due to COPD, or unrelated to COPD.</p>
        </sec>
        <sec>
          <title>Met Office Health Forecasting Data</title>
          <p>The UK Met Office Healthy Outlook service uses a rule-based model, combining observed and forecast parameters, including season, humidity, temperature, air quality, and rates of influenza-like illness to issue forecasts. These have been shown to provide a 10-day warning of periods of higher risk of COPD exacerbations at a population level [<xref ref-type="bibr" rid="ref18">18</xref>], but it is unclear whether this is predictive at an individual level. We hypothesized that including Met Office data along with telemonitoring and baseline data would improve the algorithm’s prediction. We therefore combined the telemonitoring dataset with the Met Office COPD health forecasting dataset. This consisted of the outputs of the Met Office’s Healthy Outlook COPD alert algorithm [<xref ref-type="bibr" rid="ref18">18</xref>], maximum and mean temperatures in the last 48 hours, and 3 binary temperature indicators (mean temperature &#60;2°C, maximum temperature &#60;4°C, and maximum temperature &#60;7°C).</p>
        </sec>
        <sec>
          <title>Choice of Outcomes</title>
          <p>We gave patients taking part in the study an individualized action plan, which typically advised starting antibiotics if their symptom score exceeded 5, so antibiotic courses were very frequent events. As a proxy for more serious exacerbations, we tested the prediction of two main outcomes: admission to hospital for COPD and initiation of oral corticosteroid treatment.</p>
        </sec>
        <sec>
          <title>Preprocessing</title>
          <p>We defined <italic>patient episodes</italic> as sliding windows of patient-generated data for a fixed number of consecutive days up to the current day (inputs), linked to the admission or corticosteroid outcome on the following day (output).</p>
          <p>We considered the simple score-counting algorithm in the complete-data setting, where we used only episodes without any missing symptom variables to compute risk scores for 1- or 2-day windows. Additionally, we evaluated the score-counting algorithms and the machine learning models in the imputation setting using identical patient episodes, where we imputed each missing variable by copying the last observation of that variable for that patient for up to 15 days. We excluded episodes where the outcome variable was missing and patient episodes where we could not impute the observations due to long windows of no provided data. Where we used imputation, for each variable in the patient episode, we defined an auxiliary indicator to encode whether the input variable was imputed or provided by patient; we used these auxiliary variables as additional inputs into the machine learning models. Note that the sample size and the number of admissions for the imputation setting were higher than those for the complete-data setting. For example, if some measurements were not reported prior to a hospital admission, then we excluded the episode from the complete-data analysis, but we could retain it in the imputed setting when the reported variables were exact and the missing variables were imputed.</p>
        </sec>
      </sec>
      <sec>
        <title>Data Analysis</title>
        <p>We identified a large number of potentially predictive features by using established data mining techniques (see below) and tested them in combinations using nested cross-validation procedures, where we selected and extracted the feature by using only the inner training folds of data. Because data were incomplete, we conducted separate analyses (1) limited to time periods with no missing data, and (2) from all time periods with imputation of missing data.</p>
        <sec>
          <title>Identification of Novel Features</title>
          <p>For each patient, we constructed up to 153 predictive patterns (features) from symptom, medication, and physiological measurements, by using feature extraction techniques for time series [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>], hypothesized to be predictive of the future events [<xref ref-type="bibr" rid="ref2">2</xref>] (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>). The exact number varied between the complete and imputed settings and depended on which types of variables (telemonitoring, weather, and their combinations) we used as inputs. We imputed variables measured at baseline by using population medians for the continuous variables or population modes for the categorical variables, and we assumed the variables to be fixed (stationary) throughout the study. We used the resulting variables to construct predictive models fitted to the training sets of patients. We used only the past, and not the future, variables for imputing the missing variables or constructing the time-series features for each patient episode. The resulting variables were combined to learn additional features in the hidden layers (neural nets), used for computing feature-space similarity functions (nonparametric methods), or combined with feature selection by filtering [<xref ref-type="bibr" rid="ref25">25</xref>] to set priors on hyperparameters (adaptive regularized classifiers) during training. When we used the output variables directly or indirectly to select or extract the features during training, we ensured that the procedure was nested within the training folds, so that the data used for the evaluations remained unseen.</p>
        </sec>
        <sec>
          <title>Standard Exacerbation Models</title>
          <p>We considered several definitions of exacerbations based on the criteria of Anthonisen et al [<xref ref-type="bibr" rid="ref19">19</xref>] and clinical guidelines [<xref ref-type="bibr" rid="ref26">26</xref>] and used in studies on COPD exacerbations [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. Major symptoms were changes in patients’ self-reported <italic>breathlessness</italic>, <italic>sputum color</italic>, and <italic>sputum amount</italic>, and minor symptoms were cold, wheeze, sore throat, cough, and fever. Using definitions from the literature, we considered 5 definitions of exacerbation (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>). We evaluated the onsets of exacerbations on a given day (<italic>t</italic>) as predictors of admissions the following day (<italic>t</italic> +1). Note that, from the considered definitions, only definitions 1 and 2 could be used for this type of evaluation. For example, definition 3 is defined as the presence of at least two consecutive days of major symptoms, or one major and at least one minor symptom, with the exacerbation onset taken to be the first day when the symptom criteria are met [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref27">27</xref>], whereas definition 4 is its slight modification [<xref ref-type="bibr" rid="ref15">15</xref>]. Thus, for definitions 3 to 5, by using the exacerbation indicator on day <italic>t</italic> as a marker of an admission on day <italic>t</italic> +1, we evaluated an upper bound on the predictive performance under the assumption that these exacerbations can be detected early (eg, by making accurate predictions of the future symptoms).</p>
        </sec>
        <sec>
          <title>Novel Predictive Modeling</title>
          <p>We assessed how well we could predict hospital admissions and decisions to start corticosteroid treatment in patients undergoing telemonitoring using the extracted features. We considered several types of models. (1) Nonparametric predictive methods, such as sparse maximum-margin classifiers [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]: these approaches allow for complex mappings from covariates to target outcomes to obtain high-quality “black-box” predictions. (2) Regularized classifiers based on the adaptive extensions of elastic nets [<xref ref-type="bibr" rid="ref30">30</xref>]: in low dimensions, these methods have the advantage of generating intelligible predictions, but they may sometimes result in lower predictive performance than nonparametric methods or ensembles due to rigid constraints on the mappings between covariates and outcomes. (3) Ensembles of boosted classifiers [<xref ref-type="bibr" rid="ref31">31</xref>] that we expected to be well suited for dealing with highly imbalanced datasets such as ours (where the number of episodes corresponding to COPD admissions was several orders of magnitude lower than the number of episodes without admissions). (4) Long short-term memory multitask neural network models: these methods are state-of-the-art for speech recognition, where very large datasets are available [<xref ref-type="bibr" rid="ref32">32</xref>]. However, we found their performance to be only a little better than that of the other models for our smaller incomplete imbalanced dataset. We considered these models using the preprocessing strategy discussed above and using training by a variant of back-propagation for recurrent networks.</p>
          <p>We repeated the procedure by considering features occurring (1) 24 hours prior to hospitalization or earlier, and (2) 24 hours prior to the decision to start corticosteroids or earlier. We fitted models 1 and 2 by regressing the outcomes on telemonitoring only (physiological, medication, and symptom variables), weather variables only, and telemonitoring and weather variables jointly. We used the more computationally expensive models (3 and 4) for regressing the outcomes on the telemonitoring variables in the imputed scenario. Hyperparameters were learned by the grid search (models 1 and 2) or by random search (models 3 and 4) over inner folds in the nested cross-validation procedure.</p>
          <p>We compared these methods with the conventional algorithms using multiple definitions of exacerbations from <xref ref-type="boxed-text" rid="box1">Textbox 1</xref> as predictors of the future clinical admissions and corticosteroid therapy.</p>
        </sec>
        <sec>
          <title>Validation of Novel Predictive Models</title>
          <p>To test this range of models, we used <italic>k</italic>-fold cross-validation, in which we split the data into <italic>k</italic> disjoint subsets (“folds”) of equal size, and fitted the models repeatedly to <italic>k</italic> –1 training folds, evaluating them on the remaining test fold. The procedure was repeated <italic>k</italic> times, and the overall performance was evaluated by aggregating the results across the test folds. During the nested cross-validation, we performed the cross-validation procedure for each choice of test data in a nested loop, where we used the inner training folds for feature extraction and selection and for estimating model parameters, we used the inner validation folds for estimating hyperparameters (such as the degree of model complexity), and we used the outer test folds purely for the performance evaluation. In our implementation of the procedure, we ensured that the test outer folds were made up of individuals who did not appear in the training sets or the inner folds (ie, we used no patient episodes for individuals from test datasets as any part of the training data). Thus, we used the outer test sets of patients purely for evaluations, and not for variable selection, parameter learning, or hyperparameter learning. We evaluated the predictive performance expressed as the aggregated area under the receiver operating characteristic curve (AUC), a calibration-invariant measure of predictive performance of binary classifiers. The aggregation was achieved by merging the predictions of the classifiers across the test folds and by averaging the merged AUC across multiple repetitions of cross-validation with the random fold partitions.</p>
        </sec>
        <sec>
          <title>Experimental Comparison</title>
          <p>We excluded 11 individuals with more than 95% missing data and analyzed data for 135 individuals who provided symptoms and physiological measurements regularly. We chose the outer folds to have approximately the same number of patient episodes, although an equal splitting could not be guaranteed, as patients had unequal numbers of the reported measurements. We used 10 inner and 10 outer folds of the nested cross-validation procedure for all but the most computationally expensive models. To evaluate the variation in the performance, we used 10 runs of the nested cross-validation with different training or test fold partitions.</p>
          <p>We evaluated simple score-counting algorithms that did not need long series of past symptoms to generate predictions, both in the complete and in the imputation scenarios. We used machine learning models that needed longer sequences of partially missing past observations in the imputation scenario. In that scenario, we excluded all patient episodes that we could not impute according to the considered procedure due to too much data being missing. For a fair comparison of multiple models, we ensured the consistency of the imputations and patient episodes across the folds.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Predicting Hospital Admissions of Individuals</title>
        <p>In the complete-data scenario, we evaluated how well the traditional definitions of exacerbation onset on one day predicted 24-hour hospital admissions the following day, using the definitions from <xref ref-type="boxed-text" rid="box1">Textbox 1</xref>. Depending on the choice of the algorithm, we had between 14,106 and 17,610 patient episodes, and between 8 and 17 hospital admissions. We obtained the best predictions by using definition 5 (mean AUC 0.657, 95% CI 0.523-0.792, N=16,170 patient episodes, where we computed the error bars on the AUC as the consensus estimate of the methods of empirical resampling, Chebyshev, and DeLong and colleagues [<xref ref-type="bibr" rid="ref33">33</xref>]; <xref ref-type="table" rid="table1">Table 1</xref>); however, we based this estimate on a dataset with only N<sup>+</sup>=9 admissions. Additionally, using this definition, an exacerbation starting on one day could only be detected when the score remained elevated the following day (see <xref ref-type="boxed-text" rid="box1">Textbox 1</xref>), making it impractical for predicting an admission on the second day. Score-counting algorithms definitions 1 and 2, where onsets of exacerbations are computed on a single day, resulted in the AUC estimates of 0.600 (95% CI 0.509-0.692) and 0.578 (95% CI 0.496-0.672), respectively, for N=17,610 episodes and N<sup>+</sup>=17 admissions (<xref ref-type="table" rid="table1">Table 1</xref>).</p>
        <p>When evaluated in the pragmatic imputed-data scenario allowing for missing data, with a greater number of patient episodes (N=57,150) and a greater number of hospital admissions preceded by the symptom and physiological measurements (N<sup>+</sup>=55), the performance of all the traditional definitions of exacerbation dropped to near random. For example, for definition 2, we obtained an AUC of 0.524 (95% CI 0.486-0.544); see <xref ref-type="table" rid="table1">Table 1</xref>. The most likely reason for this drop was the need to rely on a simple imputation strategy due to the limited availability of daily symptom data on the days preceding hospital admissions.</p>
        <p>Machine learning models demonstrated significant improvements in the prediction of future admissions over the traditional symptom-counting methods. Working with the imputed-data scenario, the best machine learning model (neural net) using telemonitoring data resulted in the aggregated AUC of 0.740 (95% CI 0.673-0.803) evaluated on test data for N=57,150 episodes, N<sup>+</sup>=55 admissions (<xref ref-type="table" rid="table1">Table 1</xref>). The other machine learning models had similar performance, with the mean aggregated AUC of 0.721-0.738, which shows that the improvement over symptom scores could be achieved across a range of models (see <xref ref-type="app" rid="app2">Multimedia Appendix 2</xref>). To achieve an 80% true-positive rate (sensitivity), the traditional algorithms were associated with an 80% false-positive rate (20% specificity); our algorithm halved this rate to approximately 40% (specificity around 60%).</p>
        <p>Adding the weather data (the Healthy Outlook criterion and the additional weather-related variables) to the telemonitoring measurements resulted in no significant improvement in the predictive performance of the best model, with the aggregated AUC of 0.739 (95% CI 0.685-0.794, N=57,150, N<sup>+</sup>=55). This cannot be explained by the weather variables being correlated with the telehealth variables, as the best model using the weather data only had the near-random AUC of 0.526 (95% CI 0.504-0.548, N=107,078, N<sup>+</sup>=151).</p>
        <p>The best model for admissions refitted to the entire dataset following the model selection used 135 variables and was difficult to characterize. By linearizing its outputs, we found that the factors contributing most to the predictions included all 3 groups of variables collected by telemonitoring, together with current smoking status: current symptoms, current and delayed physiological measures, and current and delayed self-reported medications.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Predictive accuracy of hospital admission and use of corticosteroids of different definitions of exacerbation.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="410"/>
            <col width="120"/>
            <col width="220"/>
            <col width="120"/>
            <col width="100"/>
            <thead>
              <tr valign="bottom">
                <td colspan="2">Description</td>
                <td>Practical</td>
                <td>AUC<sup>a</sup> (empirical 95% CI)</td>
                <td>Events, N<sup>+</sup></td>
                <td>Samples, N</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="6"><bold>Prediction of 24-hour admissions using exacerbation definitions, <italic>complete</italic> data</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 1</td>
                <td>Yes</td>
                <td>0.600 (0.509-0.692)</td>
                <td>17</td>
                <td>17,610</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 2</td>
                <td>Yes</td>
                <td>0.578 (0.496-0.672)</td>
                <td>17</td>
                <td>17,610</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 3</td>
                <td>No</td>
                <td>0.553 (0.440-0.666)</td>
                <td>8</td>
                <td>14,106</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 4</td>
                <td>No</td>
                <td>0.490 (0.424-0.556)</td>
                <td>8</td>
                <td>14,106</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 5</td>
                <td>No</td>
                <td>0.657 (0.523-0.792)</td>
                <td>9</td>
                <td>16,170</td>
              </tr>
              <tr valign="top">
                <td colspan="6"><bold>Prediction of 24-hour admissions using exacerbation definitions, <italic>imputed</italic> data</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 1</td>
                <td>Yes</td>
                <td>0.513 (0.477-0.551)</td>
                <td>55</td>
                <td>57,150</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 2</td>
                <td>Yes</td>
                <td>0.524 (0.486-0.544)</td>
                <td>55</td>
                <td>57,150</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 3</td>
                <td>No</td>
                <td>0.496 (0.471-0.521)</td>
                <td>55</td>
                <td>56,702</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 4</td>
                <td>No</td>
                <td>0.505 (0.473-0.536)</td>
                <td>55</td>
                <td>56,702</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 5</td>
                <td>No</td>
                <td>0.517 (0.479-0.555)</td>
                <td>55</td>
                <td>57,150</td>
              </tr>
              <tr valign="top">
                <td colspan="6"><bold>Prediction of 24-hour corticosteroid decisions using exacerbation definitions, <italic>complete</italic> data</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 1</td>
                <td>Yes</td>
                <td>0.655 (0.630-0.679)</td>
                <td>238</td>
                <td>9768</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 2</td>
                <td>Yes</td>
                <td>0.605 (0.581-0.628)</td>
                <td>238</td>
                <td>9768</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 3</td>
                <td>No</td>
                <td>0.568 (0.544-0.592)</td>
                <td>178</td>
                <td>8489</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 4</td>
                <td>No</td>
                <td>0.544 (0.522-0.567)</td>
                <td>178</td>
                <td>8489</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 5</td>
                <td>No</td>
                <td>0.646 (0.622-0.670)</td>
                <td>237</td>
                <td>9322</td>
              </tr>
              <tr valign="top">
                <td colspan="6"><bold>Prediction of 24-hour corticosteroid decisions using exacerbation definitions, <italic>imputed</italic> data</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 1</td>
                <td>Yes</td>
                <td>0.660 (0.639-0.681)</td>
                <td>316</td>
                <td>13,899</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 2</td>
                <td>Yes</td>
                <td>0.605 (0.585-0.625)</td>
                <td>316</td>
                <td>13,899</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 3</td>
                <td>No</td>
                <td>0.564 (0.543-0.586)</td>
                <td>228</td>
                <td>10,442</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 4</td>
                <td>No</td>
                <td>0.543 (0.524-0.564)</td>
                <td>228</td>
                <td>10,442</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Definition 5</td>
                <td>No</td>
                <td>0.647 (0.626-0.668)</td>
                <td>316</td>
                <td>12,477</td>
              </tr>
              <tr valign="top">
                <td colspan="6"><bold>Prediction of 24-hour admissions using machine learning models, <italic>imputed</italic> data</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Machine learning model</td>
                <td>Yes</td>
                <td>0.740 (0.673-0.803)</td>
                <td>55</td>
                <td>57,150</td>
              </tr>
              <tr valign="top">
                <td colspan="6"><bold>Prediction of 24-hour corticosteroid decisions using exacerbation definitions, <italic>imputed</italic> data</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Machine learning model</td>
                <td>Yes</td>
                <td>0.765 (0.738-0.791)</td>
                <td>316</td>
                <td>13,503</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>AUC: area under the receiver operating characteristic curve.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Predicting Peaks in Symptom Scores in Populations</title>
        <p>The Healthy Outlook [<xref ref-type="bibr" rid="ref18">18</xref>] algorithm and the weather variables did not improve the quality of predictions of hospital admissions for individuals in our dataset. However, at the population level we found that, over some contiguous time periods, predominantly during fall and winter, prediction of the 2-week population-averaged baseline-adjusted symptom score using the Healthy Outlook variables outperformed the prediction of the simple delayed baseline-adjusted symptom score. The Spearman correlation between the true and the predicted outcomes over the test data folds increased from 0.44-0.55 (the lagged heuristic) to 0.66-0.75 (Healthy Outlook), and the Kendall rank correlation increased from 0.27-0.38 to 0.44-0.52. See <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref> for additional detail.</p>
      </sec>
      <sec>
        <title>Predicting Individuals Starting Corticosteroids</title>
        <p>In contrast to the prediction of hospital admissions, the standard score-counting algorithms were moderately predictive of decisions to start corticosteroid treatments, both in the complete-data and in the imputed-data scenario. Here, we included in the analysis only episodes where patients reported not taking corticosteroids on the first day of the exacerbation. The onset events were defined as taking corticosteroids on the following day. Using definition 1 (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>), we obtained an AUC of 0.655 (95% CI 0.630-0.679) for the complete-data scenario with N=9768 episodes and N<sup>+</sup>=238 corticosteroid therapy onsets (<xref ref-type="table" rid="table1">Table 1</xref>). In the imputed-data scenario, we obtained an AUC of 0.660 (95% CI 0.639-0.681) with N=13,899 episodes and N<sup>+</sup>=316 corticosteroid therapy onsets. Although the machine learning models helped to improve the predictions, leading to an AUC of 0.765 (95% CI 0.738-0.791) on the test datasets, this improvement was relatively lower than in the case of predicting the admissions. The algorithm for predicting corticosteroid onsets (a nonparametric model) used 153 features, where the most important one, as suggested by linearizing, was the total symptom score on the current day.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Results</title>
        <p>In the context of telemonitoring, traditional algorithms of predicting exacerbations with imputation of missing symptom data were no better than chance when they were used for predicting a COPD admission over the subsequent 24 hours, and were only a little better than chance in the subset with complete data provided by patients. The performance of machine learning algorithms was considerably more accurate and, in practice and subject to some conditions, would have halved the number of false alerts in comparison with the traditional method (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref> for additional detail). The algorithm readily identified those at high and low risk of admission, suggesting that, in a resource-constrained environment, a simple triage strategy for targeting additional care could be based on using the output of our method. Adding meteorological data did not significantly enhance the accuracy of the model at an individual level, although it did so, to some extent, at a group level for the prediction of average baseline-adjusted symptom scores, which could be of value to service planners. We found that both the standard symptom-counting algorithms and the machine learning algorithms were reasonably accurate for predicting the decision to start corticosteroids within 24 hours.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Despite the Telescot COPD trial [<xref ref-type="bibr" rid="ref11">11</xref>] being one of the largest individually randomized trials of telehealth in COPD, the absolute number of admissions immediately preceded by a complete record of physiological and symptom variables was relatively small, which may have reduced the reliability of the algorithm.</p>
        <p>The lack of a gold standard definition for what constitutes an exacerbation is a challenge to research in this area. Many mild to moderate exacerbations were defined by medication use, and patients’ individualized management plans advised commencement of antibiotics with an increase in symptoms (eg, if their sputum was dark green). Some also kept corticosteroids, which they took if they were very breathless or wheezy. This self-management may have interfered with what would otherwise have been the natural history of the exacerbation, reducing the relationship between some symptoms and signs and the outcome (hospital admission), but potentially strengthening the relationship between some components of the algorithm and decision to start corticosteroids. Nonetheless, we find the fact that the machine learning algorithm can predict future admissions despite adjusting for self-reported medications to be encouraging.</p>
        <p>One methodological limitation of our approach is its reliance on cross-validation, rather than multiple independent cohorts, for evaluations of the predictive performance. In addition to ignoring possible covariate or distribution shifts across multiple cohorts, another well-known disadvantage of cross-validation is the complexity of approximating confidence intervals of the performance measures [<xref ref-type="bibr" rid="ref34">34</xref>], especially for small or imbalanced datasets. The use of a resampling approach such as cross-validation was unavoidable given the small number of large telemonitoring trials for COPD. Further validations in unrelated datasets will be needed to confirm our findings. One strength of our approach is the use of complementary machine learning methods in the derivation of the optimal algorithm and consistency of the findings across the methods. The considered methods included regularized parametric and kernel methods, boosting, and representation learning. A limitation of our approach is its reliance on fixed-length feature vectors extracted from time-series data, rather than variable-length predictors. We argue that, although there have been some recent works on using variable-length approaches for time-series predictions [<xref ref-type="bibr" rid="ref35">35</xref>], they demonstrated superior performance over other methods when the number of cases exceeded ours by several orders of magnitude, and they were not extensively compared with sparse classifiers reliant on imputation methods. The closest match to such models from those we considered—the long short-term memory with the imputation strategy described above—did not improve on the other models. Handling the systematic missingness in variable-length conditional models is an actively researched area that will be considered in the future, and which is likely to become useful once bigger telemonitoring datasets are collected. In this study, we used imputation by forward-feeding, which is arguably one of the most practical approaches at the point of inference when access to past data is limited; other techniques may potentially be considered.</p>
        <p>The aim of this study was to demonstrate the potential of machine learning for predicting COPD admissions and corticosteroid use, not to elucidate the effects of each feature or combination of features under different adjustments. Modern artificial intelligence methods for predicting clinical events use hundreds or even thousands of features to predict clinical outcomes [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. Due to complex architectures and interactions between multiple variables, it is challenging to estimate the effects of each feature [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. In this study, we investigated the effects only of classes of variables (telehealth, weather-related, and their combinations) rather than each single variable. This is a general limitation of high-dimensional methods; future work is needed to investigate the marginal and conditional effects, and a validation in a device trial will be needed prior to translation to clinical practice.</p>
        <p>A limitation of our work is that some of the measures were available at only 1 or 2 time points (eg, anxiety and depression scores, quality of life, exercise or physical activity data, and smoking status were assessed at the beginning and end of the 1-year trial), and time-series data might have been more informative. Other multicomponent scores known to be predictive of COPD outcomes (such as the body mass index, obstruction, dyspnea, exercise index [<xref ref-type="bibr" rid="ref39">39</xref>] or dyspnea, obstruction, smoking, exacerbation index [<xref ref-type="bibr" rid="ref40">40</xref>]) might have been useful predictors, as would serial FEV<sub>1</sub> and more detailed serial information on medication changes. Our machine learning platform is extendable to such new types of data sources that may include systematic or informative missingness, which is the strength of the approach.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>Interest in the development of more accurate predictive algorithms using machine learning is increasing; Sanchez-Morillo and colleagues [<xref ref-type="bibr" rid="ref41">41</xref>] in a recent review concluded that, while some of these show promise, they have been based on relatively small numbers of patients and events [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]. They require validation in larger samples of patients, for longer periods of time. The closest to ours is probably the very recent work of Shah et al [<xref ref-type="bibr" rid="ref44">44</xref>], who used logistic regression to predict future exacerbations and showed that using pulse rate, oxygen saturation, and respiratory rate (from a pulse oximeter) showed improved predictivity when compared with traditional algorithms of COPD exacerbations. Our result in respect of the value of meteorological data is consistent with the work of Steventon et al [<xref ref-type="bibr" rid="ref45">45</xref>] on the impact of Healthy Outlook on admission rates.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>The early detection and management of COPD remains an important goal given the huge personal and economic costs of the condition. Machine learning approaches, which can be tailored to an individual’s baseline profile and can learn from experience of the individual patient, show promise in achieving this goal. There is a need for larger datasets with which to develop more accurate algorithms; however, the lack of an effect of telehealth in COPD demonstrated in trials has effectively discouraged large implementations of the technology. One solution (if governance regulations can be overcome) is to amalgamate existing international datasets. Another may be to explore the ability of algorithms to predict moderate (nonhospitalized) exacerbations with all the challenges highlighted above. Additionally, the potential of machine learning to elucidate optimal interventions should be explored.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>Supplementary data.</p>
        <media xlink:href="jmir_v20i9e263_app1.pdf" xlink:title="PDF File (Adobe PDF File), 665KB"/>
      </app>
      <app id="app2">
        <title>Multimedia Appendix 2</title>
        <p>Receiver operating characteristic (ROC) of the multitask neural net (MTNN) and the symptom-counting exacerbation score (after [2]) for prediction of 24-hour admissions using the imputed data scenario. The areas under the mean aggregate ROC curves over test data are ~0.74 and ~0.52 respectively.</p>
        <media xlink:href="jmir_v20i9e263_app2.png" xlink:title="PNG File, 69KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">COPD</term>
          <def>
            <p>chronic obstructive pulmonary disease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">FEV 
          <sub>1</sub></term>
          <def>
            <p>forced expiratory volume in the first second of expiration</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">NHS</term>
          <def>
            <p>National Health Service</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">UK</term>
          <def>
            <p>United Kingdom</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was funded by a UK Medical Research Council Confidence in Concept grant and further supported by an Innovate UK grant. The original data collection was supported by the Scottish Government Chief Scientist Office. Additional financial support was received from the Edinburgh Clinical Trials Unit. This work could not have been completed without the participating patients and clinicians from NHS Lothian.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>FA is founder and stakeholder at Pharmatics Ltd. CS is an employee of the Met Office, a Trading Fund of the Department for Business, Energy and Industrial Strategy.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Guarascio</surname>
            <given-names>AJ</given-names>
          </name>
          <name name-style="western">
            <surname>Ray</surname>
            <given-names>SM</given-names>
          </name>
          <name name-style="western">
            <surname>Finch</surname>
            <given-names>CK</given-names>
          </name>
          <name name-style="western">
            <surname>Self</surname>
            <given-names>TH</given-names>
          </name>
        </person-group>
        <article-title>The clinical and economic burden of chronic obstructive pulmonary disease in the USA</article-title>
        <source>Clinicoecon Outcomes Res</source>  
        <year>2013</year>  
        <volume>5</volume>  
        <fpage>235</fpage>  
        <lpage>45</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.doi.org/10.2147/CEOR.S34321"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2147/CEOR.S34321</pub-id>
        <pub-id pub-id-type="medline">23818799</pub-id>
        <pub-id pub-id-type="pii">ceor-5-235</pub-id>
        <pub-id pub-id-type="pmcid">PMC3694800</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Seemungal</surname>
            <given-names>TA</given-names>
          </name>
          <name name-style="western">
            <surname>Donaldson</surname>
            <given-names>GC</given-names>
          </name>
          <name name-style="western">
            <surname>Bhowmik</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Jeffries</surname>
            <given-names>DJ</given-names>
          </name>
          <name name-style="western">
            <surname>Wedzicha</surname>
            <given-names>JA</given-names>
          </name>
        </person-group>
        <article-title>Time course and recovery of exacerbations in patients with chronic obstructive pulmonary disease</article-title>
        <source>Am J Respir Crit Care Med</source>  
        <year>2000</year>  
        <month>05</month>  
        <volume>161</volume>  
        <issue>5</issue>  
        <fpage>1608</fpage>  
        <lpage>13</lpage>  
        <pub-id pub-id-type="doi">10.1164/ajrccm.161.5.9908022</pub-id>
        <pub-id pub-id-type="medline">10806163</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Seemungal</surname>
            <given-names>TA</given-names>
          </name>
          <name name-style="western">
            <surname>Donaldson</surname>
            <given-names>GC</given-names>
          </name>
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>EA</given-names>
          </name>
          <name name-style="western">
            <surname>Bestall</surname>
            <given-names>JC</given-names>
          </name>
          <name name-style="western">
            <surname>Jeffries</surname>
            <given-names>DJ</given-names>
          </name>
          <name name-style="western">
            <surname>Wedzicha</surname>
            <given-names>JA</given-names>
          </name>
        </person-group>
        <article-title>Effect of exacerbation on quality of life in patients with chronic obstructive pulmonary disease</article-title>
        <source>Am J Respir Crit Care Med</source>  
        <year>1998</year>  
        <month>05</month>  
        <volume>157</volume>  
        <issue>5 Pt 1</issue>  
        <fpage>1418</fpage>  
        <lpage>22</lpage>  
        <pub-id pub-id-type="doi">10.1164/ajrccm.157.5.9709032</pub-id>
        <pub-id pub-id-type="medline">9603117</pub-id></nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ure</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Pinnock</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Hanley</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Kidd</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>McCall</surname>
            <given-names>SE</given-names>
          </name>
          <name name-style="western">
            <surname>Tarling</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Pagliari</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Sheikh</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>MacNee</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>McKinstry</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <article-title>Piloting tele-monitoring in COPD: a mixed methods exploration of issues in design and implementation</article-title>
        <source>Prim Care Respir J</source>  
        <year>2012</year>  
        <month>03</month>  
        <volume>21</volume>  
        <issue>1</issue>  
        <fpage>57</fpage>  
        <lpage>64</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.doi.org/10.4104/pcrj.2011.00065"/>
        </comment>  
        <pub-id pub-id-type="doi">10.4104/pcrj.2011.00065</pub-id>
        <pub-id pub-id-type="medline">21785816</pub-id>
        <pub-id pub-id-type="pii">pcrj-2010-11-0132-R1</pub-id></nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>McLean</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Nurmatov</surname>
            <given-names>U</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>JL</given-names>
          </name>
          <name name-style="western">
            <surname>Pagliari</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Car</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Sheikh</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Telehealthcare for chronic obstructive pulmonary disease</article-title>
        <source>Cochrane Database Syst Rev</source>  
        <year>2011</year>  
        <issue>7</issue>  
        <fpage>CD007718</fpage>  
        <pub-id pub-id-type="doi">10.1002/14651858.CD007718.pub2</pub-id>
        <pub-id pub-id-type="medline">21735417</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Polisena</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Tran</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Cimon</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Hutton</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>McGill</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Palmer</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Scott</surname>
            <given-names>RE</given-names>
          </name>
        </person-group>
        <article-title>Home telehealth for chronic obstructive pulmonary disease: a systematic review and meta-analysis</article-title>
        <source>J Telemed Telecare</source>  
        <year>2010</year>  
        <volume>16</volume>  
        <issue>3</issue>  
        <fpage>120</fpage>  
        <lpage>7</lpage>  
        <pub-id pub-id-type="doi">10.1258/jtt.2009.090812</pub-id>
        <pub-id pub-id-type="medline">20197355</pub-id>
        <pub-id pub-id-type="pii">jtt.2009.090812</pub-id></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bolton</surname>
            <given-names>CE</given-names>
          </name>
          <name name-style="western">
            <surname>Waters</surname>
            <given-names>CS</given-names>
          </name>
          <name name-style="western">
            <surname>Peirce</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Elwyn</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Insufficient evidence of benefit: a systematic review of home telemonitoring for COPD</article-title>
        <source>J Eval Clin Pract</source>  
        <year>2011</year>  
        <month>12</month>  
        <volume>17</volume>  
        <issue>6</issue>  
        <fpage>1216</fpage>  
        <lpage>22</lpage>  
        <pub-id pub-id-type="doi">10.1111/j.1365-2753.2010.01536.x</pub-id>
        <pub-id pub-id-type="medline">20846317</pub-id></nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Steventon</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Bardsley</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Billings</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Dixon</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Doll</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Hirani</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Cartwright</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Rixon</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Knapp</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Henderson</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Rogers</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Fitzpatrick</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Hendy</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Newman</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Whole</surname>
            <given-names>SDET</given-names>
          </name>
        </person-group>
        <article-title>Effect of telehealth on use of secondary care and mortality: findings from the Whole System Demonstrator cluster randomised trial</article-title>
        <source>BMJ</source>  
        <year>2012</year>  
        <volume>344</volume>  
        <fpage>e3874</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/cgi/pmidlookup?view=long&#38;pmid=22723612"/>
        </comment>  
        <pub-id pub-id-type="medline">22723612</pub-id>
        <pub-id pub-id-type="pmcid">PMC3381047</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pinnock</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Hanley</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Lewis</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>MacNee</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Pagliari</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>van der Pol</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Sheikh</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>McKinstry</surname>
            <given-names>B</given-names>
          </name>
          <collab>TELESCOT Programme Group</collab>
        </person-group>
        <article-title>The impact of a telemetric chronic obstructive pulmonary disease monitoring service: randomised controlled trial with economic evaluation and nested qualitative study</article-title>
        <source>Prim Care Respir J</source>  
        <year>2009</year>  
        <month>09</month>  
        <volume>18</volume>  
        <issue>3</issue>  
        <fpage>233</fpage>  
        <lpage>5</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.4104/pcrj.2009.00040"/>
        </comment>  
        <pub-id pub-id-type="doi">10.4104/pcrj.2009.00040</pub-id>
        <pub-id pub-id-type="medline">19588056</pub-id>
        <pub-id pub-id-type="pii">RHI-007-09</pub-id></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Rodriguez-Roisin</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Toward a consensus definition for COPD exacerbations</article-title>
        <source>Chest</source>  
        <year>2000</year>  
        <month>05</month>  
        <volume>117</volume>  
        <issue>5 Suppl 2</issue>  
        <fpage>398S</fpage>  
        <lpage>401S</lpage>  
        <pub-id pub-id-type="medline">10843984</pub-id>
        <pub-id pub-id-type="pii">S0012-3692(15)32859-2</pub-id></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pinnock</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Hanley</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>McCloughan</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Todd</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Krishan</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Lewis</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Stoddart</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>van</surname>
            <given-names>DPM</given-names>
          </name>
          <name name-style="western">
            <surname>MacNee</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Sheikh</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Pagliari</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>McKinstry</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <article-title>Effectiveness of telemonitoring integrated into existing clinical services on hospital admission for exacerbation of chronic obstructive pulmonary disease: researcher blind, multicentre, randomised controlled trial</article-title>
        <source>BMJ</source>  
        <year>2013</year>  
        <volume>347</volume>  
        <fpage>f6070</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/cgi/pmidlookup?view=long&#38;pmid=24136634"/>
        </comment>  
        <pub-id pub-id-type="medline">24136634</pub-id>
        <pub-id pub-id-type="pmcid">PMC3805483</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Leidy</surname>
            <given-names>NK</given-names>
          </name>
          <name name-style="western">
            <surname>Wilcox</surname>
            <given-names>TK</given-names>
          </name>
          <name name-style="western">
            <surname>Jones</surname>
            <given-names>PW</given-names>
          </name>
          <name name-style="western">
            <surname>Roberts</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Powers</surname>
            <given-names>JH</given-names>
          </name>
          <name name-style="western">
            <surname>Sethi</surname>
            <given-names>S</given-names>
          </name>
          <collab>EXACT-PRO Study Group</collab>
        </person-group>
        <article-title>Standardizing measurement of chronic obstructive pulmonary disease exacerbations. Reliability and validity of a patient-reported diary</article-title>
        <source>Am J Respir Crit Care Med</source>  
        <year>2011</year>  
        <month>02</month>  
        <day>01</day>  
        <volume>183</volume>  
        <issue>3</issue>  
        <fpage>323</fpage>  
        <lpage>9</lpage>  
        <pub-id pub-id-type="doi">10.1164/rccm.201005-0762OC</pub-id>
        <pub-id pub-id-type="medline">20813886</pub-id>
        <pub-id pub-id-type="pii">201005-0762OC</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Jones</surname>
            <given-names>PW</given-names>
          </name>
          <name name-style="western">
            <surname>Harding</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Berry</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Wiklund</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Kline</surname>
            <given-names>LN</given-names>
          </name>
        </person-group>
        <article-title>Development and first validation of the COPD Assessment Test</article-title>
        <source>Eur Respir J</source>  
        <year>2009</year>  
        <month>09</month>  
        <volume>34</volume>  
        <issue>3</issue>  
        <fpage>648</fpage>  
        <lpage>54</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://erj.ersjournals.com/cgi/pmidlookup?view=long&#38;pmid=19720809"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1183/09031936.00102509</pub-id>
        <pub-id pub-id-type="medline">19720809</pub-id>
        <pub-id pub-id-type="pii">34/3/648</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hurst</surname>
            <given-names>JR</given-names>
          </name>
          <name name-style="western">
            <surname>Donaldson</surname>
            <given-names>GC</given-names>
          </name>
          <name name-style="western">
            <surname>Quint</surname>
            <given-names>JK</given-names>
          </name>
          <name name-style="western">
            <surname>Goldring</surname>
            <given-names>JJP</given-names>
          </name>
          <name name-style="western">
            <surname>Patel</surname>
            <given-names>ARC</given-names>
          </name>
          <name name-style="western">
            <surname>Wedzicha</surname>
            <given-names>JA</given-names>
          </name>
        </person-group>
        <article-title>Domiciliary pulse-oximetry at exacerbation of chronic obstructive pulmonary disease: prospective pilot study</article-title>
        <source>BMC Pulm Med</source>  
        <year>2010</year>  
        <month>10</month>  
        <day>20</day>  
        <volume>10</volume>  
        <fpage>52</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpulmmed.biomedcentral.com/articles/10.1186/1471-2466-10-52"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1471-2466-10-52</pub-id>
        <pub-id pub-id-type="medline">20961450</pub-id>
        <pub-id pub-id-type="pii">1471-2466-10-52</pub-id>
        <pub-id pub-id-type="pmcid">PMC2978135</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Burton</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Pinnock</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>McKinstry</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <article-title>Changes in telemonitored physiological variables and symptoms prior to exacerbations of chronic obstructive pulmonary disease</article-title>
        <source>J Telemed Telecare</source>  
        <year>2015</year>  
        <month>01</month>  
        <volume>21</volume>  
        <issue>1</issue>  
        <fpage>29</fpage>  
        <lpage>36</lpage>  
        <pub-id pub-id-type="doi">10.1177/1357633X14562733</pub-id>
        <pub-id pub-id-type="medline">25475218</pub-id>
        <pub-id pub-id-type="pii">1357633X14562733</pub-id></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Goodfellow</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Bengio</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Courville</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <source>Deep Learning</source>  
        <year>2016</year>  
        <publisher-loc>Cambridge, MA</publisher-loc>
        <publisher-name>MIT Press</publisher-name></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hastie</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Tibshirani</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Friedman</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <source>The Elements of Statistical Learning: Data Mining, Inference, and Prediction. 2nd edition</source>  
        <year>2011</year>  
        <publisher-loc>New York, NY</publisher-loc>
        <publisher-name>Springer</publisher-name></nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sarran</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Halpin</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Levy</surname>
            <given-names>ML</given-names>
          </name>
          <name name-style="western">
            <surname>Prigmore</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Sachon</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>A retrospective study of the impact of a telephone alert service (Healthy Outlook) on hospital admissions for patients with chronic obstructive pulmonary disease</article-title>
        <source>NPJ Prim Care Respir Med</source>  
        <year>2014</year>  
        <month>10</month>  
        <day>23</day>  
        <volume>24</volume>  
        <fpage>14080</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25340279"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1038/npjpcrm.2014.80</pub-id>
        <pub-id pub-id-type="medline">25340279</pub-id>
        <pub-id pub-id-type="pii">npjpcrm201480</pub-id>
        <pub-id pub-id-type="pmcid">PMC4373472</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Anthonisen</surname>
            <given-names>NR</given-names>
          </name>
          <name name-style="western">
            <surname>Manfreda</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Warren</surname>
            <given-names>CP</given-names>
          </name>
          <name name-style="western">
            <surname>Hershfield</surname>
            <given-names>ES</given-names>
          </name>
          <name name-style="western">
            <surname>Harding</surname>
            <given-names>GK</given-names>
          </name>
          <name name-style="western">
            <surname>Nelson</surname>
            <given-names>NA</given-names>
          </name>
        </person-group>
        <article-title>Antibiotic therapy in exacerbations of chronic obstructive pulmonary disease</article-title>
        <source>Ann Intern Med</source>  
        <year>1987</year>  
        <month>02</month>  
        <volume>106</volume>  
        <issue>2</issue>  
        <fpage>196</fpage>  
        <lpage>204</lpage>  
        <pub-id pub-id-type="medline">3492164</pub-id></nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bestall</surname>
            <given-names>JC</given-names>
          </name>
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>EA</given-names>
          </name>
          <name name-style="western">
            <surname>Garrod</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Garnham</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Jones</surname>
            <given-names>PW</given-names>
          </name>
          <name name-style="western">
            <surname>Wedzicha</surname>
            <given-names>JA</given-names>
          </name>
        </person-group>
        <article-title>Usefulness of the Medical Research Council (MRC) dyspnoea scale as a measure of disability in patients with chronic obstructive pulmonary disease</article-title>
        <source>Thorax</source>  
        <year>1999</year>  
        <month>07</month>  
        <volume>54</volume>  
        <issue>7</issue>  
        <fpage>581</fpage>  
        <lpage>6</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://thorax.bmj.com/cgi/pmidlookup?view=long&#38;pmid=10377201"/>
        </comment>  
        <pub-id pub-id-type="medline">10377201</pub-id>
        <pub-id pub-id-type="pmcid">PMC1745516</pub-id></nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zigmond</surname>
            <given-names>AS</given-names>
          </name>
          <name name-style="western">
            <surname>Snaith</surname>
            <given-names>RP</given-names>
          </name>
        </person-group>
        <article-title>The hospital anxiety and depression scale</article-title>
        <source>Acta Psychiatr Scand</source>  
        <year>1983</year>  
        <month>06</month>  
        <volume>67</volume>  
        <issue>6</issue>  
        <fpage>361</fpage>  
        <lpage>70</lpage>  
        <pub-id pub-id-type="medline">6880820</pub-id></nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Jones</surname>
            <given-names>PW</given-names>
          </name>
        </person-group>
        <article-title>St. George's Respiratory Questionnaire: MCID</article-title>
        <source>COPD</source>  
        <year>2005</year>  
        <month>03</month>  
        <volume>2</volume>  
        <issue>1</issue>  
        <fpage>75</fpage>  
        <lpage>9</lpage>  
        <pub-id pub-id-type="medline">17136966</pub-id></nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Geurts</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <person-group person-group-type="editor">
          <name name-style="western">
            <surname>De Raedt</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Siebes</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Pattern extraction for time series classification</article-title>
        <source>Principles of Data Mining and Knowledge Discovery</source>  
        <year>2001</year>  
        <publisher-loc>Berlin, Germany</publisher-loc>
        <publisher-name>Springer</publisher-name>
        <fpage>115</fpage>  
        <lpage>127</lpage> </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Caruana</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Lou</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Gehrke</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Koch</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Elhadad</surname>
            <given-names>N</given-names>
          </name>
        </person-group>
        <article-title>Intelligible models for healthcare: predicting pneumonia risk and hospital 30-day readmission</article-title>
        <year>2015</year>  
        <conf-name>21st ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
        <conf-date>Aug 10-13, 2015</conf-date>
        <conf-loc>Sydney, Australia</conf-loc>
        <fpage>1721</fpage>  
        <lpage>1730</lpage>  
        <pub-id pub-id-type="doi">10.1145/2783258.2788613</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Guyon</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Elisseeff</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>An introduction to variable and feature selection</article-title>
        <source>J Mach Learn Res</source>  
        <year>2003</year>  
        <volume>3</volume>  
        <fpage>1157</fpage>  
        <lpage>82</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmlr.org/papers/volume3/guyon03a/guyon03a.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <collab>Counseil du medicament Quebec</collab>
        </person-group>
        <source>[Acute Bronchitis and Acute Exacerbation of Chronic Obstructive Pulmonary Disease, Clinical Guide]</source>  
        <year>2009</year>  
        <month>10</month>  
        <publisher-loc>Quebec, QC</publisher-loc>
        <publisher-name>Institut national d'excellence en santé et en services sociaux</publisher-name></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wilkinson</surname>
            <given-names>TMA</given-names>
          </name>
          <name name-style="western">
            <surname>Donaldson</surname>
            <given-names>GC</given-names>
          </name>
          <name name-style="western">
            <surname>Hurst</surname>
            <given-names>JR</given-names>
          </name>
          <name name-style="western">
            <surname>Seemungal</surname>
            <given-names>TAR</given-names>
          </name>
          <name name-style="western">
            <surname>Wedzicha</surname>
            <given-names>JA</given-names>
          </name>
        </person-group>
        <article-title>Early therapy improves outcomes of exacerbations of chronic obstructive pulmonary disease</article-title>
        <source>Am J Respir Crit Care Med</source>  
        <year>2004</year>  
        <month>06</month>  
        <day>15</day>  
        <volume>169</volume>  
        <issue>12</issue>  
        <fpage>1298</fpage>  
        <lpage>303</lpage>  
        <pub-id pub-id-type="doi">10.1164/rccm.200310-1443OC</pub-id>
        <pub-id pub-id-type="medline">14990395</pub-id>
        <pub-id pub-id-type="pii">200310-1443OC</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bonilla</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Agakov</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Williams</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Kernel multi-task learning using task-specific features</article-title>
        <year>2007</year>  
        <conf-name>Eleventh International Conference on Artificial Intelligence and Statistics (AISTATS 2007)</conf-name>
        <conf-date>Mar 21-24, 2007</conf-date>
        <conf-loc>San Juan, Puerto Rico</conf-loc>
        <fpage>43</fpage>  
        <lpage>50</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://proceedings.mlr.press/v2/bonilla07a/bonilla07a.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Fan</surname>
            <given-names>RE</given-names>
          </name>
          <name name-style="western">
            <surname>Chang</surname>
            <given-names>KW</given-names>
          </name>
          <name name-style="western">
            <surname>Hsieh</surname>
            <given-names>CJ</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>XR</given-names>
          </name>
          <name name-style="western">
            <surname>Lin</surname>
            <given-names>CJ</given-names>
          </name>
        </person-group>
        <article-title>LIBLINEAR: a library for large linear classification</article-title>
        <source>J Mach Learn Res</source>  
        <year>2008</year>  
        <volume>9</volume>  
        <fpage>1871</fpage>  
        <lpage>1874</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmlr.org/papers/volume9/fan08a/fan08a.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zou</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Hastie</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <article-title>Regularization variable selection via the elastic net</article-title>
        <source>J Royal Stat Soc B</source>  
        <year>2005</year>  
        <volume>67</volume>  
        <issue>2</issue>  
        <fpage>301</fpage>  
        <lpage>20</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://rss.onlinelibrary.wiley.com/doi/epdf/10.1111/j.1467-9868.2005.00503.x"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Galar</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Fernandez</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Barrenechea</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Bustince</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Herrera</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <article-title>A review on ensembles for the class imbalance problem: bagging-, boosting-, and hybrid-based approaches</article-title>
        <source>IEEE Trans Syst Man Cybern Part C Appl Rev</source>  
        <year>2012</year>  
        <month>07</month>  
        <volume>42</volume>  
        <issue>4</issue>  
        <fpage>463</fpage>  
        <lpage>484</lpage>  
        <pub-id pub-id-type="doi">10.1109/TSMCC.2011.2161285</pub-id></nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sak</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Senior</surname>
            <given-names>AW</given-names>
          </name>
          <name name-style="western">
            <surname>Beaufays</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <source>Long short-term memory based recurrent neural network architectures for large vocabulary speech recognition</source>  
        <year>2014</year>  
        <access-date>2018-08-31</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1402.1128.pdf">https://arxiv.org/pdf/1402.1128.pdf</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="7245Ofra9"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>DeLong</surname>
            <given-names>ER</given-names>
          </name>
          <name name-style="western">
            <surname>DeLong</surname>
            <given-names>DM</given-names>
          </name>
          <name name-style="western">
            <surname>Clarke-Pearson</surname>
            <given-names>DL</given-names>
          </name>
        </person-group>
        <article-title>Comparing the areas under two or more correlated receiver operating characteristic curves: a nonparamentric approach</article-title>
        <source>Biometrics</source>  
        <year>1988</year>  
        <month>09</month>  
        <volume>44</volume>  
        <issue>3</issue>  
        <fpage>837</fpage>  
        <pub-id pub-id-type="doi">10.2307/2531595</pub-id></nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bengio</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Grandvalet</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <article-title>No unbiased estimator of the variance of k-fold cross-validation</article-title>
        <source>J Mach Learn Res</source>  
        <year>2004</year>  
        <volume>5</volume>  
        <fpage>1089</fpage>  
        <lpage>105</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmlr.org/papers/volume5/grandvalet04a/grandvalet04a.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Che</surname>
            <given-names>Z</given-names>
          </name>
          <name name-style="western">
            <surname>Purushotham</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Cho</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Sontag</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <source>Recurrent neural networks for multivariate time series with missing values</source>  
        <year>2016</year>  
        <access-date>2018-08-30</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1606.01865.pdf">https://arxiv.org/pdf/1606.01865.pdf</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="7245SQCgI"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Oh</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Makar</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Fusco</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>McCaffrey</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Rao</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Ryan</surname>
            <given-names>EE</given-names>
          </name>
          <name name-style="western">
            <surname>Washer</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>West</surname>
            <given-names>LR</given-names>
          </name>
          <name name-style="western">
            <surname>Young</surname>
            <given-names>VB</given-names>
          </name>
          <name name-style="western">
            <surname>Guttag</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Hooper</surname>
            <given-names>DC</given-names>
          </name>
          <name name-style="western">
            <surname>Shenoy</surname>
            <given-names>ES</given-names>
          </name>
          <name name-style="western">
            <surname>Wiens</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>A generalizable, data-driven approach to predict daily risk of clostridium difficile infection at two large academic health centers</article-title>
        <source>Infect Control Hosp Epidemiol</source>  
        <year>2018</year>  
        <month>04</month>  
        <volume>39</volume>  
        <issue>4</issue>  
        <fpage>425</fpage>  
        <lpage>433</lpage>  
        <pub-id pub-id-type="doi">10.1017/ice.2018.16</pub-id>
        <pub-id pub-id-type="medline">29576042</pub-id>
        <pub-id pub-id-type="pii">S0899823X18000168</pub-id></nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ribeiro</surname>
            <given-names>MT</given-names>
          </name>
          <name name-style="western">
            <surname>Singh</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Guestrin</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <source>Why should I trust you? Explaining the predictions of any classifier. Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source>  
        <year>2016</year>  
        <publisher-loc>New York, NY</publisher-loc>
        <publisher-name>Association for Computing Machinery</publisher-name>
        <fpage>1135</fpage>  
        <lpage>1144</lpage> </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Doshi-Velez</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <source>Towards a rigorous science of interpretable machine learning</source>  
        <year>2016</year>  
        <access-date>2018-08-30</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1702.08608.pdf">https://arxiv.org/pdf/1702.08608.pdf</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="7245bauqG"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Esteban</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Quintana</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Moraza</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Aburto</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Aguirre</surname>
            <given-names>U</given-names>
          </name>
          <name name-style="western">
            <surname>Aguirregomoscorta</surname>
            <given-names>JI</given-names>
          </name>
          <name name-style="western">
            <surname>Aizpiri</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Basualdo</surname>
            <given-names>LV</given-names>
          </name>
          <name name-style="western">
            <surname>Capelastegui</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>BODE-Index vs HADO-score in chronic obstructive pulmonary disease: which one to use in general practice?</article-title>
        <source>BMC Med</source>  
        <year>2010</year>  
        <month>05</month>  
        <day>24</day>  
        <volume>8</volume>  
        <fpage>28</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedicine.biomedcentral.com/articles/10.1186/1741-7015-8-28"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1741-7015-8-28</pub-id>
        <pub-id pub-id-type="medline">20497527</pub-id>
        <pub-id pub-id-type="pii">1741-7015-8-28</pub-id>
        <pub-id pub-id-type="pmcid">PMC2880999</pub-id></nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sundh</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Janson</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Lisspers</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Ställberg</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Montgomery</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>The Dyspnoea, Obstruction, Smoking, Exacerbation (DOSE) index is predictive of mortality in COPD</article-title>
        <source>Prim Care Respir J</source>  
        <year>2012</year>  
        <month>09</month>  
        <volume>21</volume>  
        <issue>3</issue>  
        <fpage>295</fpage>  
        <lpage>301</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.4104/pcrj.2012.00054"/>
        </comment>  
        <pub-id pub-id-type="doi">10.4104/pcrj.2012.00054</pub-id>
        <pub-id pub-id-type="medline">22786813</pub-id>
        <pub-id pub-id-type="pii">pcrj-2012-04-0066</pub-id></nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sanchez-Morillo</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Fernandez-Granero</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Leon-Jimenez</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Use of predictive algorithms in-home monitoring of chronic obstructive pulmonary disease and asthma: a systematic review</article-title>
        <source>Chron Respir Dis</source>  
        <year>2016</year>  
        <month>08</month>  
        <volume>13</volume>  
        <issue>3</issue>  
        <fpage>264</fpage>  
        <lpage>83</lpage>  
        <pub-id pub-id-type="doi">10.1177/1479972316642365</pub-id>
        <pub-id pub-id-type="medline">27097638</pub-id>
        <pub-id pub-id-type="pii">1479972316642365</pub-id></nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Fernandez-Granero</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Sanchez-Morillo</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Lopez-Gordo</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Leon</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <person-group person-group-type="editor">
          <name name-style="western">
            <surname>Ferrandez Vicente</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Alverez-Sanchez</surname>
            <given-names>JR</given-names>
          </name>
          <name name-style="western">
            <surname>de la Paz Lopez</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Toledo-Moreo</surname>
            <given-names>FJ</given-names>
          </name>
          <name name-style="western">
            <surname>Adeli</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>A machine learning approach to prediction of exacerbations of chronic obstructive pulmonary disease</article-title>
        <source>Artificial Computation in Biology and Medicine</source>  
        <year>2015</year>  
        <publisher-loc>Cham, Switzerland</publisher-loc>
        <publisher-name>Springer Nature Switzerland</publisher-name></nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Amalakuhan</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Kiljanek</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Parvathaneni</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Hester</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Cheriyath</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Fischman</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>A prediction model for COPD readmissions: catching up, catching our breath, and improving a national problem</article-title>
        <source>J Community Hosp Intern Med Perspect</source>  
        <year>2012</year>  
        <volume>2</volume>  
        <issue>1</issue>  
        <fpage>1</fpage>  
        <lpage>7</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23882354"/>
        </comment>  
        <pub-id pub-id-type="doi">10.3402/jchimp.v2i1.9915</pub-id>
        <pub-id pub-id-type="medline">23882354</pub-id>
        <pub-id pub-id-type="pii">9915</pub-id>
        <pub-id pub-id-type="pmcid">PMC3714087</pub-id></nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Shah</surname>
            <given-names>SA</given-names>
          </name>
          <name name-style="western">
            <surname>Velardo</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Farmer</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Tarassenko</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Exacerbations in chronic obstructive pulmonary disease: identification and prediction using a digital health system</article-title>
        <source>J Med Internet Res</source>  
        <year>2017</year>  
        <month>03</month>  
        <day>07</day>  
        <volume>19</volume>  
        <issue>3</issue>  
        <fpage>e69</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmir.org/2017/3/e69/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.7207</pub-id>
        <pub-id pub-id-type="medline">28270380</pub-id>
        <pub-id pub-id-type="pii">v19i3e69</pub-id>
        <pub-id pub-id-type="pmcid">PMC5360891</pub-id></nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Steventon</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Bardsley</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Mays</surname>
            <given-names>N</given-names>
          </name>
        </person-group>
        <article-title>Effect of a telephonic alert system (Healthy outlook) for patients with chronic obstructive pulmonary disease: a cohort study with matched controls</article-title>
        <source>J Public Health (Oxf)</source>  
        <year>2015</year>  
        <month>06</month>  
        <volume>37</volume>  
        <issue>2</issue>  
        <fpage>313</fpage>  
        <lpage>21</lpage>  
        <pub-id pub-id-type="doi">10.1093/pubmed/fdu042</pub-id>
        <pub-id pub-id-type="medline">25012531</pub-id>
        <pub-id pub-id-type="pii">fdu042</pub-id></nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
