<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v23i8e26843</article-id>
      <article-id pub-id-type="pmid">34448704</article-id>
      <article-id pub-id-type="doi">10.2196/26843</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Predicting Kidney Graft Survival Using Machine Learning Methods: Prediction Model Development and Feature Significance Analysis Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Kukafka</surname>
            <given-names>Rita</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Giabbanelli</surname>
            <given-names>Philippe</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Mahmoudi</surname>
            <given-names>Elham</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Naqvi</surname>
            <given-names>Syed Asil Ali</given-names>
          </name>
          <degrees>MCS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Computer Science</institution>
            <institution>Dalhousie University</institution>
            <addr-line>Goldberg Computer Science Bldg</addr-line>
            <addr-line>6050 University Ave</addr-line>
            <addr-line>Halifax, NS, B3H 1W5</addr-line>
            <country>Canada</country>
            <phone>1 9023290504</phone>
            <email>a.naqvi@dal.ca</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1422-3793</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Tennankore</surname>
            <given-names>Karthik</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7919-6709</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Vinson</surname>
            <given-names>Amanda</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9345-5252</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Roy</surname>
            <given-names>Patrice C</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8635-0305</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Abidi</surname>
            <given-names>Syed Sibte Raza</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3075-7736</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Computer Science</institution>
        <institution>Dalhousie University</institution>
        <addr-line>Halifax, NS</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Division of Nephrology</institution>
        <institution>Dalhousie University</institution>
        <addr-line>Halifax, NS</addr-line>
        <country>Canada</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Syed Asil Ali Naqvi <email>a.naqvi@dal.ca</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>8</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>27</day>
        <month>8</month>
        <year>2021</year>
      </pub-date>
      <volume>23</volume>
      <issue>8</issue>
      <elocation-id>e26843</elocation-id>
      <history>
        <date date-type="received">
          <day>4</day>
          <month>1</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>1</day>
          <month>2</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>10</day>
          <month>3</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>6</day>
          <month>5</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Syed Asil Ali Naqvi, Karthik Tennankore, Amanda Vinson, Patrice C Roy, Syed Sibte Raza Abidi. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 27.08.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2021/8/e26843" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Kidney transplantation is the optimal treatment for patients with end-stage renal disease. Short- and long-term kidney graft survival is influenced by a number of donor and recipient factors. Predicting the success of kidney transplantation is important for optimizing kidney allocation.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to predict the risk of kidney graft failure across three temporal cohorts (within 1 year, within 5 years, and after 5 years following a transplant) based on donor and recipient characteristics. We analyzed a large data set comprising over 50,000 kidney transplants covering an approximate 20-year period.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We applied machine learning–based classification algorithms to develop prediction models for the risk of graft failure for three different temporal cohorts. Deep learning–based autoencoders were applied for data dimensionality reduction, which improved the prediction performance. The influence of features on graft survival for each cohort was studied by investigating a new nonoverlapping patient stratification approach.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Our models predicted graft survival with area under the curve scores of 82% within 1 year, 69% within 5 years, and 81% within 17 years. The feature importance analysis elucidated the varying influence of clinical features on graft survival across the three different temporal cohorts.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>In this study, we applied machine learning to develop risk prediction models for graft failure that demonstrated a high level of prediction performance. Acknowledging that these models performed better than those reported in the literature for existing risk prediction tools, future studies will focus on how best to incorporate these prediction models into clinical care algorithms to optimize the long-term health of kidney recipients.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>kidney transplantation</kwd>
        <kwd>machine learning</kwd>
        <kwd>predictive modeling</kwd>
        <kwd>survival prediction</kwd>
        <kwd>dimensionality reduction</kwd>
        <kwd>feature sensitivity analysis</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Kidneys are vital for the health of an individual, as they filter waste products from the blood and produce hormones and urine [<xref ref-type="bibr" rid="ref1">1</xref>]. Patients are considered to have end-stage renal disease when their kidney function falls below a specific threshold [<xref ref-type="bibr" rid="ref2">2</xref>]. A lack of timely measures to prevent kidney failure results in premature death [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>].</p>
        <p>Kidney transplantation [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>] and dialysis are the two main treatments for kidney failure [<xref ref-type="bibr" rid="ref7">7</xref>]. Kidney transplantation offers a survival advantage compared with other forms of kidney replacement therapy; however, the rate of graft loss following transplant is still undesirably high [<xref ref-type="bibr" rid="ref8">8</xref>]. Kidneys are a limited resource, and optimizing the match between donors and recipients is crucial for improving outcomes after transplantation. Kidney transplant allocation is, in part, based on a number of donor-recipient–related factors that influence graft survival. Various clinical studies have been conducted on the influence of these factors on graft survival; however, given the complex interactions between these factors, there remains much to be learned in this area. Existing risk prediction models only have a limited ability to predict outcomes for kidney transplant recipients with receiver operating characteristic scores of 0.6-0.7 [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>].</p>
        <p>Prediction modeling using machine learning (ML) algorithms has gained attention in recent years [<xref ref-type="bibr" rid="ref12">12</xref>] for predicting the success of clinical or surgical procedures (such as kidney transplant). ML algorithms autonomously learn the underlying associations between preprocedure clinical features and postprocedural outcomes to predict the outcome of the procedure for a given clinical case. In kidney transplant, ML-based prediction models, based on donor-recipient information, autonomously learn the underlying relationships between donor and recipient factors to predict transplant outcomes. Multiple studies have been conducted using ML methods to predict the kidney graft outcome [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]; however, the standard approach in nearly all the reviewed studies has been to select one or more arbitrary period starting from the date of transplant and applying classification algorithms for prediction. There is a clear need for further exploration of data stratification approaches and other ML methods with respect to feature engineering and prediction modeling.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>In this study, the intent is to investigate kidney transplant allograft survival, that is, estimating the time-to-event and the evolving influence of clinical features leading to an event—within three temporal cohorts of 1 year, &#62;1-5 years, and &#62;5 years of a kidney transplant. We predicted the outcome of graft failure after kidney transplant based on the analysis of donor and recipient features. We applied ML methods to (1) predict the graft status over different temporal periods and (2) analyze the changing effect of donor-recipient–related predictors across different periods. To develop the prediction models, we analyzed a large data set of over 50,000 transplants covering approximately a 20-year period of kidney transplants in the United States. To generate the clinically meaningful temporal cohorts, we experimented with two patient stratification approaches: (1) a novel <italic>nonoverlapping</italic> patient stratification approach, whereby a patient’s graft failure was recorded only in the temporal cohort when it actually happened, that is, a graft failure event in the preceding cohort was not included and (2) the traditional <italic>overlapping</italic> patient stratification approach that provides an accumulative count of graft outcomes until a specific time point. To develop the prediction models, we investigated multiple ML algorithms using both patient stratification approaches. Nonoverlapping temporal cohorts were considered to investigate the influence of clinical features on predicting graft survival over time, as the temporal partitioning of the data allowed for the establishment of feature influence across distinct temporal windows. We applied the feature importance method based on the mean decrease in impurity (Gini).</p>
        <p>The contributions of this research are as follows: (1) ML-based prediction models that are trained on a large data set, offering improved prediction performance compared with previous studies (previous graft prediction studies are based on a smaller number of transplants over a shorter period); (2) data dimensionality reduction based on a deep learning framework to handle the high-dimensional and complex kidney transplant data set; (3) a novel nonoverlapping patient stratification approach to provide fine-grained feature importance within a specific period while avoiding bias from preceding cohorts; (4) explaining the influence of the different clinical features, during different periods, toward the prediction performance of ML prediction models. This finding allows the selection of the most important features to predict graft outcomes within a specific temporal window; and (5) a comparison between the two stratification approaches with respect to the performance of the prediction models. The future practical outcome of this study is the provision of a data-driven decision support tool to assist nephrologists in the kidney allocation process by identifying the best donor and recipient pair that will lead to the highest likelihood of graft survival for a given recipient.</p>
      </sec>
      <sec>
        <title>Prior Work</title>
        <p>Patients can receive a kidney from either deceased donors or living donors. The donor-recipient matching process becomes relatively more complex with deceased donors because of the need to account for additional clinical factors (ie, prolonged cold ischemia time, prolonged wait times, and generally lower quality organs) [<xref ref-type="bibr" rid="ref17">17</xref>]. Given the fact that kidney organs are a limited resource, it is important to have an efficient and effective donor-recipient matching process to ensure long-term graft survival [<xref ref-type="bibr" rid="ref18">18</xref>].</p>
        <p>Data-driven methods are now being used for organ matching; these methods are used to establish clinical compatibility beyond the blood group and tissue type. Conventional data-driven prediction methods use statistical techniques such as Cox proportional hazard models and Kaplan-Meier estimates to perform time-to-event analyses [<xref ref-type="bibr" rid="ref19">19</xref>]. Significant research has been conducted with Cox-based models in the survival analysis of different organ transplants; however, these methods eventually lose predictive accuracy as the feature space increases [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>].</p>
        <p>ML-based data analysis to develop prediction models for predicting outcomes is usually performed using classification methods, whereas regression methods are used for time-to-event analysis. There are two prominent approaches to predict kidney allograft outcomes using ML-based classification methods. The first approach is to predict graft survival over time by dividing a longitudinal data set into different time cohorts based on the occurrence of a given adverse event or the last follow-up date from the date of transplant. Each time cohort has a binary target variable, that is, success or failure of the graft, which is used to train the classification model to predict graft survival [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. The second approach is to predict the risk acuity associated with a graft within a period. Topuz et al [<xref ref-type="bibr" rid="ref15">15</xref>] used this approach and divided the data set into three graft failure risk groups (high, medium, and low) across three different periods to predict the risk of graft failure within a specific time using classification methods. Li et al [<xref ref-type="bibr" rid="ref20">20</xref>] used Bayes net to classify graft risk levels and predict graft survival.</p>
        <p>Due to the high dimensionality of existing data sets for organ transplantation, feature selection is applied to filter out redundant features. A stacked autoencoder, which is an unsupervised neural network, is an efficient dimensionality reduction technique with promising performance for deep representation of medical data [<xref ref-type="bibr" rid="ref21">21</xref>] that reconstructs its own inputs by first encoding them to a smaller size and then decoding back to the original inputs. A comparative study by Sadati et al [<xref ref-type="bibr" rid="ref22">22</xref>] highlighted the efficacy of different types of autoencoders for data sets based on electronic health records.</p>
        <p>Right-censored data are a common problem for survival analysis, as it represents cases for which the adverse event is not available or recorded because of either the subject having been lost to follow-up or not experiencing the event during the study period. Multiple approaches have been adopted in previous studies to address this problem. The study on kidney transplants by Topuz et al [<xref ref-type="bibr" rid="ref15">15</xref>] discarded all the right-censored data before 7 years from the time of transplant and included the remaining transplants that took place after that time point in the low-risk group. In a study predicting heart transplant outcomes, the data set was divided into three different time cohorts (1, 5, and 9 years) to predict the status of the graft. Patients who did not have graft failure during a particular time cohort were censored, and all the patients beyond that time cohort were considered to have successful transplants [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
        <p>The influence of clinical features (or clinical predictors) on graft survival tends to vary over time [<xref ref-type="bibr" rid="ref16">16</xref>], as shown using a heat map [<xref ref-type="bibr" rid="ref24">24</xref>]. Dag et al [<xref ref-type="bibr" rid="ref23">23</xref>] analyzed the changing significance of features for three overlapping time cohorts (1, 5, and 9 years). They deduced that certain types of features perform well in the long term compared with the short and medium terms. For instance, socioeconomic factors were more influential in their 9-year time cohort as they covered major variations in the data. It is important to note here that feature significance over time can only be substantiated if the analysis is performed with nonoverlapping cohorts to avoid any bias introduced by the cumulative effect of data before the analysis period.</p>
        <p>In previous studies [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref25">25</xref>], predicting graft failure has been pursued by taking an overlapping patient stratification approach, which means that each subsequent time cohort includes data from the previous cohort. This introduces a cumulative effect that is useful for predicting graft failure across a staggered time period. However, the overlapping patient stratification approach is ineffective in determining the influence of clinical features during a specific time period. Hence, the nonoverlapped cohort approach offers a novel mechanism to investigate the influence of clinical features within specific time windows. To the best of our knowledge, nonoverlapping cohorts have not been studied in the literature to develop prediction models or analyze the temporal influence of clinical features on kidney transplant outcomes.</p>
        <p>This study is organized into five major sections: <italic>Methods</italic> presents the study’s methodology; <italic>Results</italic> presents the results of the prediction; and <italic>Discussion</italic> discusses the significance of clinical features toward graft status prediction across different time cohorts and offers a conclusion and future research directions.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>To predict graft survival over time and to analyze the influence of clinical features on graft survival, our data analytics methodology (<xref rid="figure1" ref-type="fig">Figure 1</xref>) comprised data preparation, feature engineering, prediction modeling, model evaluation, and analysis of changing relevance of features.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Overview of our data analytics methodology. AUC: area under the curve; SMOTE: synthetic minority oversampling technique; UNOS: united network of organ sharing.</p>
          </caption>
          <graphic xlink:href="jmir_v23i8e26843_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Data Description</title>
        <p>This study used data from the Scientific Registry of Transplant Recipients (SRTR). The SRTR data system includes data on all donors, wait-listed candidates, and transplant recipients in the United States, submitted by the members of the Organ Procurement and Transplantation Network. The Health Resources and Services Administration and the US Department of Health and Human Services provided an overview of the activities of the Organ Procurement and Transplantation Network and SRTR contractors.</p>
        <p>The data set provided pretransplant clinical features and outcomes of 277,316 kidney transplants between 2000 and 2017. Survival was reported in terms of graft outcome and patient status. For the purposes of this study, graft failure was defined as (1) graft loss or (2) death with a functioning graft.</p>
        <p>We analyzed the data and used only complete cases (ie, no missing feature values), which comprised a total of 52,827 kidney transplants. <xref ref-type="table" rid="table1">Table 1</xref> provides a list of the included clinical features and their descriptions used in our experiments.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>List of clinical features used to train the prediction models.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td>Feature description</td>
                <td>Data type</td>
                <td>Abbreviation</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Peak panel reactive antibody</td>
                <td>Continuous</td>
                <td>PKPRA</td>
              </tr>
              <tr valign="top">
                <td>Type of transplant</td>
                <td>Categorical</td>
                <td>REC_TX_PROCEDURE</td>
              </tr>
              <tr valign="top">
                <td>Any previous kidney transplant</td>
                <td>Categorical</td>
                <td>PREVKI</td>
              </tr>
              <tr valign="top">
                <td>Donor age</td>
                <td>Continuous</td>
                <td>DAGE</td>
              </tr>
              <tr valign="top">
                <td>Donor height</td>
                <td>Continuous</td>
                <td>DHT100</td>
              </tr>
              <tr valign="top">
                <td>Recipient height</td>
                <td>Continuous</td>
                <td>RHT2100</td>
              </tr>
              <tr valign="top">
                <td>Donor weight</td>
                <td>Continuous</td>
                <td>DWT</td>
              </tr>
              <tr valign="top">
                <td>Recipient weight</td>
                <td>Continuous</td>
                <td>RWT2</td>
              </tr>
              <tr valign="top">
                <td>Donor creatinine level</td>
                <td>Continuous</td>
                <td>DONCREAT</td>
              </tr>
              <tr valign="top">
                <td>Expanded criteria donor</td>
                <td>Categorical</td>
                <td>ECD</td>
              </tr>
              <tr valign="top">
                <td>Donation after cardiac death</td>
                <td>Categorical</td>
                <td>DCD</td>
              </tr>
              <tr valign="top">
                <td>Donor hypertension</td>
                <td>Categorical</td>
                <td>DHTN2</td>
              </tr>
              <tr valign="top">
                <td>Recipient hypertension</td>
                <td>Categorical</td>
                <td>RHTN</td>
              </tr>
              <tr valign="top">
                <td>Recipient BMI</td>
                <td>Continuous</td>
                <td>RBMI2</td>
              </tr>
              <tr valign="top">
                <td>Donor BMI</td>
                <td>Continuous</td>
                <td>DBMI</td>
              </tr>
              <tr valign="top">
                <td>Cold ischemia time</td>
                <td>Continuous</td>
                <td>CIT</td>
              </tr>
              <tr valign="top">
                <td>Recipient age</td>
                <td>Continuous</td>
                <td>RAGETX</td>
              </tr>
              <tr valign="top">
                <td>Number of HLA antigen mismatches (paired)</td>
                <td>Categorical</td>
                <td>HLAMM</td>
              </tr>
              <tr valign="top">
                <td>Functional status of the recipient</td>
                <td>Categorical</td>
                <td>FUNCTSTAT</td>
              </tr>
              <tr valign="top">
                <td>Donor-recipient sex (paired)</td>
                <td>Categorical</td>
                <td>DRSEX</td>
              </tr>
              <tr valign="top">
                <td>Donor-recipient race (paired)</td>
                <td>Categorical</td>
                <td>DRRACE</td>
              </tr>
              <tr valign="top">
                <td>Donor-recipient age (paired)</td>
                <td>Categorical</td>
                <td>DRAGE</td>
              </tr>
              <tr valign="top">
                <td>Recipient cardiovascular disease</td>
                <td>Categorical</td>
                <td>RCVD</td>
              </tr>
              <tr valign="top">
                <td>Donor hepatitis C virus</td>
                <td>Categorical</td>
                <td>DHCV</td>
              </tr>
              <tr valign="top">
                <td>Recipient peripheral vascular disease</td>
                <td>Categorical</td>
                <td>RPVD</td>
              </tr>
              <tr valign="top">
                <td>Donor race</td>
                <td>Categorical</td>
                <td>DRACESIMP</td>
              </tr>
              <tr valign="top">
                <td>Recipient race</td>
                <td>Categorical</td>
                <td>RRACESIMP</td>
              </tr>
              <tr valign="top">
                <td>Recipient malignancy</td>
                <td>Categorical</td>
                <td>RMALIG</td>
              </tr>
              <tr valign="top">
                <td>Years on dialysis pretransplant</td>
                <td>Continuous</td>
                <td>VINTAGE</td>
              </tr>
              <tr valign="top">
                <td>Donor diabetes</td>
                <td>Categorical</td>
                <td>DDM</td>
              </tr>
              <tr valign="top">
                <td>Preemptive transplant</td>
                <td>Categorical</td>
                <td>PREEMPTIVE</td>
              </tr>
              <tr valign="top">
                <td>Recipient diabetes</td>
                <td>Categorical</td>
                <td>RDM2</td>
              </tr>
              <tr valign="top">
                <td>Recipient coronary artery disease</td>
                <td>Categorical</td>
                <td>RCAD</td>
              </tr>
              <tr valign="top">
                <td>Simplified ESRD<sup>a</sup> diagnosis</td>
                <td>Categorical</td>
                <td>ESRDDXSIMP</td>
              </tr>
              <tr valign="top">
                <td>Donor-recipient CMV<sup>b</sup> (paired)</td>
                <td>Categorical</td>
                <td>DRCMV</td>
              </tr>
              <tr valign="top">
                <td>Donor-recipient height difference</td>
                <td>Categorical</td>
                <td>AHD1</td>
              </tr>
              <tr valign="top">
                <td>Donor-recipient weight difference</td>
                <td>Categorical</td>
                <td>DRWT</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>ESRD: end-stage renal disease.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>CMV: cytomegalovirus.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Data Preparation</title>
        <p>Data preparation for learning the ML-based prediction models consisted of data cleaning, partitioning the data set into temporal cohorts, and addressing class imbalances.</p>
        <sec>
          <title>Data Cleaning</title>
          <p>Data cleaning involved removing (1) all patient identifying features (such as transplant ID, donor ID, and patient ID) [<xref ref-type="bibr" rid="ref23">23</xref>], (2) post- and intraoperative features (such as delayed graft function and warm ischemia time) as we focused on pretransplant features to predict outcomes [<xref ref-type="bibr" rid="ref23">23</xref>], (3) living donors [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref26">26</xref>], (4) recipients below the age of 18 years [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>], and (5) all sequential and en bloc transplants, both of which are atypical procedures that would not broadly apply to most deceased donor situations. These exclusion criteria were suggested by domain experts and also noted in prior studies [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref28">28</xref>].</p>
        </sec>
        <sec>
          <title>Data Partitioning Into Temporal Cohorts</title>
          <p>Given the longitudinal data set, we generated two distinct data sets using traditional <italic>overlapping</italic> and our novel <italic>nonoverlapping</italic> patient stratification approaches to partition the data set into three temporal cohorts representing graft status at 1 year, &#62;1-5 years, and 5-17 years (<xref rid="figure2" ref-type="fig">Figures 2</xref> and <xref rid="figure3" ref-type="fig">3</xref>).</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Derivation of the overlapped cohorts.</p>
            </caption>
            <graphic xlink:href="jmir_v23i8e26843_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Derivation of the nonoverlapped cohorts.</p>
            </caption>
            <graphic xlink:href="jmir_v23i8e26843_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <p>The overlapping patient stratification approach (used in previous graft status prediction studies) provides a cumulative analysis of graft outcomes up to a specific time point. In our study, the overlapping data stratification resulted in the following three cohorts: cohort 1, spanning from year<sub>0</sub> to year<sub>1</sub>, which reported graft outcomes (ie, graft failure or survival) during this period; cohort 2, which reported graft status from year<sub>0</sub> to year<sub>5</sub> and overlapped with cohort 1 such that it included the patients in cohort 1<italic>;</italic> and cohort 3<italic>,</italic> which reported graft status from year<sub>0</sub> to year<sub>10+</sub>, thus overlapping with both earlier cohorts. As per the overlapping approach, a graft failure in the preceding cohort was also counted in the proceeding cohort.</p>
          <p>Our nonoverlapping patient stratification approach yielded three cohorts: cohort 1<italic>,</italic> spanning year<sub>0</sub> to year<sub>1,</sub> reporting graft outcomes in this period; cohort 2, spanning year<sub>1</sub> to year<sub>5</sub> and reporting graft outcomes only in this period, resulting in the exclusion of graft failures reported in cohort 1 and only reporting the graft outcomes of patients who survived cohort 1<italic>;</italic> and cohort 3, spanning year<sub>5</sub> to year<sub>10+</sub>, reporting the graft outcomes of patients who survived cohort 2<italic>.</italic> In a nonoverlapping cohort approach, there was no looking back beyond the cohort’s starting point, as such a graft failure in the preceding cohort was not counted in the proceeding cohort.</p>
          <p>When partitioning the data into cohorts, we accounted for the presence of censored data, that is, the lack of information about the occurrence of an adverse event for a surviving patient. There is no concrete method to determine survivors when confronted with censored data. We initially assumed that those patients who did not fail in a certain cohort could be presumed as survivors. However, this assumption led to two problems: (1) it included censored patients who might have experienced graft failure during the study, and (2) it led to a severe class imbalance between the graft failure and surviving patients. To overcome these problems, we took a two-phase heuristic approach to remove the censored observations to identify <italic>survivors</italic> in each cohort. First, we removed all the censored observations from the cohort being analyzed and labeled all the remaining instances as survived. For instance, the censored data that were removed for cohort 2 were all instances with a missing outcome by the end of cohort 2. The remaining instances were considered to have survived. The first phase of our approach reduced the number of censored observations, but the surviving observations were still relatively high compared with the graft failure cases in each cohort. In the second phase, we applied the approach of Topuz et al [<xref ref-type="bibr" rid="ref15">15</xref>] to further refine our surviving class by removing all the instances that were deemed as surviving for less than 8 years from the date of transplant. This two-phase approach to account for censored data is summarized in Equation 1 below, where we estimated the number of survivors in each cohort.</p>
          <graphic xlink:href="jmir_v23i8e26843_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          <p>The first part of this equation illustrates the first phase of the proposed approach. The <italic>i</italic> in the equation is the ending year of our defined cohorts, that is, 1, 5, and 17. The equation first calculates the total number of graft failures that occurred after the end of the cohort. This fraction of instances was considered as confirmed survivors for the cohort under analysis. The second part of the equation deals with the second phase of the approach. It attempts to identify the potential survivors from the censored data by removing all the observations that did not have a graft failure within 8 years (2920 days) following a transplant. <xref ref-type="table" rid="table2">Table 2</xref> shows the patient distribution across the three time cohorts.</p>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Number of failed and survived transplants in overlapped and nonoverlapped cohorts.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="100"/>
              <col width="110"/>
              <col width="170"/>
              <col width="170"/>
              <col width="0"/>
              <col width="110"/>
              <col width="170"/>
              <col width="170"/>
              <thead>
                <tr valign="top">
                  <td>Cohort</td>
                  <td colspan="4">Overlapping</td>
                  <td colspan="3">Nonoverlapping</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Count, n</td>
                  <td>Failed, n (%)</td>
                  <td>Survived, n (%)</td>
                  <td colspan="2">Count, n</td>
                  <td>Failed, n (%)</td>
                  <td>Survived, n (%)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>1</td>
                  <td>52,827</td>
                  <td>7554 (14.3)</td>
                  <td>45,273 (85.7)</td>
                  <td colspan="2">52,827</td>
                  <td>7554 (14.3)</td>
                  <td>45,273 (85.7)</td>
                </tr>
                <tr valign="top">
                  <td>2</td>
                  <td>52,827</td>
                  <td>23,475 (44.44)</td>
                  <td>29,352 (55.56)</td>
                  <td colspan="2">45,273</td>
                  <td>15,921 (35.17)</td>
                  <td>29,352 (64.83)</td>
                </tr>
                <tr valign="top">
                  <td>3</td>
                  <td>52,827</td>
                  <td>37,939 (71.82)</td>
                  <td>14,888 (28.18)</td>
                  <td colspan="2">29,352</td>
                  <td>14,464 (49.28)</td>
                  <td>14,888 (50.72)</td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
        </sec>
      </sec>
      <sec>
        <title>Addressing Class Imbalance</title>
        <p>Our data set had two outcomes: the presence or absence of graft failure. There was a significant class imbalance whereby the <italic>graft failure</italic> had a significantly lower number of instances compared with <italic>graft survival.</italic> Techniques such as Synthetic Minority Oversampling Technique (SMOTE) and random undersampling have been widely used in the literature [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref29">29</xref>] for class imbalance. We applied SMOTE for Nominal and Continuous features [<xref ref-type="bibr" rid="ref30">30</xref>], which is a variant of SMOTE specifically developed to handle a mix of categorical and numerical data, on all cohorts to achieve a reasonable class balance. To balance the minority class (ie, mostly <italic>graft failure</italic>), we would need to generate 600% additional synthetic samples (at least for cohort 1), which would have led to overfitting. Therefore, we doubled our minority class to achieve a workable class balance to prevent the overfitting of the classification models. As cohort 2 of overlapped stratification and cohort 3 of nonoverlapped stratification had a class balance, they were not considered for oversampling.</p>
      </sec>
      <sec>
        <title>Feature Engineering</title>
        <p>This step involved both the removal and construction of features with the intent to reduce the dimensionality of the feature space.</p>
        <sec>
          <title>Paired Features</title>
          <p>A set of paired features was constructed by combining the related features. Typically, graft predictions use discrete individual donor and recipient features. We examined the underlying correlation between the donor and recipient features and paired the highly related features to generate new <italic>paired features</italic>. The following four donor and recipient features were generated: sex, age, CMV (cytomegalovirus), and race. In addition, three types of HLA Antigen Mismatch features—ie, HLA Antigen Mismatch at the A Locus, HLA Antigen Mismatch at the B Locus, and HLA Antigen Mismatch at the DR Locus were also combined into a single HLA Antigen Mismatch feature.</p>
        </sec>
        <sec>
          <title>One-Hot Encoding</title>
          <p>We transformed the categorical features into multiple dummy features to make them compatible with the stacked autoencoders, which cannot process categorical features. In addition, it was also a necessary operation because of the functional constraint of the scikit-learn library [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
        </sec>
        <sec>
          <title>Stacked Autoencoders</title>
          <p>Finally, we used 86 transformed categorical features as inputs to the stacked autoencoders for feature reduction to subsequently train the ML prediction models. Continuous features were also initially considered as a part of the input vector to stacked autoencoders (Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), but preliminary model training returned better results with pristine continuous features; hence, no modification was performed for them while training the prediction models. It should be noted that the resultant features from the stacked autoencoders were only used for training the prediction models and not for the analysis of the changing relevance of features over time.</p>
          <p>After testing with different configuration settings provided in the Keras framework [<xref ref-type="bibr" rid="ref32">32</xref>], the stacked autoencoders were set up as a 13-layer architecture consisting of 12 dense layers and one dropout layer set at the very beginning of the network with a dropout rate of 0.05. The sigmoid activation function was used throughout the dense layers, with Adam as the optimizer and binary cross entropy as the loss function with 500 epochs and 700-900 batch sizes. The middle layer of the autoencoder was finally trained with 12 neurons and 30 neurons for cohort 1 and the remaining cohorts, respectively. The feature space was reduced by more than 50 dummy features.</p>
        </sec>
      </sec>
      <sec>
        <title>Learning Classification-Based Graft Survival Prediction Models</title>
        <sec>
          <title>Overview</title>
          <p>Prediction was pursued as a binary classification problem, where the prediction output represents the graft outcome for a given patient in terms of the class label, graft failure or survived. We investigated four different ML-based classification models for each time cohort (ie, cohorts 1-3). Given that logistic regression (LR) has been widely used in prior studies to develop graft prediction models [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref33">33</xref>], we trained an LR model as a baseline to compare the predictive performance of our ML prediction models.</p>
          <p>All classification models were trained using a 10-fold stratified cross-validation training approach. The stratification ensured that outcome class ratio in each fold is maintained to avoid any sampling bias that may affect the classification results. We mainly used the scikit-learn library [<xref ref-type="bibr" rid="ref31">31</xref>] to train the below-mentioned classification models with the parameter settings listed in <xref ref-type="table" rid="table3">Table 3</xref>. Hyperparameters were optimized using a random search. The different parameters that were tested during the random search are provided in Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
          <table-wrap position="float" id="table3">
            <label>Table 3</label>
            <caption>
              <p>Algorithmic settings for the classifiers.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="470"/>
              <col width="500"/>
              <thead>
                <tr valign="top">
                  <td colspan="2">Method, Hyperparameter</td>
                  <td>Values</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="3">
                    <bold>RF<sup>a</sup></bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Number of estimators</td>
                  <td>200</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Class weight</td>
                  <td>Balanced</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Criterion</td>
                  <td>Gini</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Maximum depth</td>
                  <td>9</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Minimum samples split</td>
                  <td>2 for cohort 1; 3 for the rest</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Maximum features</td>
                  <td>14</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Support vector machine</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>C<sup>b</sup></td>
                  <td>50</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Gamma</td>
                  <td>Auto, scale</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Decision function shape</td>
                  <td>One versus rest</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Kernel</td>
                  <td>Radial</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Artificial neural network</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Solver</td>
                  <td>Adam</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Learning rate</td>
                  <td>Adaptive</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Activation</td>
                  <td>Logistic</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Alpha</td>
                  <td>1e-2,1e-6</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Hidden layers</td>
                  <td><italic>4</italic>: 70, 35, 30, 15; <italic>5</italic>: 60, 30, 30, 15, 10</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Adaptive boosting</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Base learner</td>
                  <td>RF</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Number of estimators</td>
                  <td>401</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Learning rate</td>
                  <td>1</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Algorithm</td>
                  <td>Samme.R</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Logistic regression</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Penalty</td>
                  <td>l2</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>C</td>
                  <td>10</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Class weight</td>
                  <td>Balanced</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Max iteration</td>
                  <td>1000</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Solver</td>
                  <td>Sag</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table3fn1">
                <p><sup>a</sup>RF: random forest.</p>
              </fn>
              <fn id="table3fn2">
                <p><sup>b</sup>C: regularization parameter.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Random Forest</title>
          <p>Random forest (RF) was used as both a standalone classifier and a base learner for the adaptive boosting (AdaBoost) algorithm. It has been widely used to predict survival data [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>].</p>
        </sec>
        <sec>
          <title>AdaBoost</title>
          <p>The AdaBoost algorithm was applied to two weak learners, RF and LR. The study by Thongkam et al [<xref ref-type="bibr" rid="ref34">34</xref>] used this algorithm on a breast cancer data set, where it outperformed all single classifiers. In our experiments, LR did not perform well; therefore, we did not pursue it. RF, with the optimized hyperparameters, was used to train the boosting classifier with a number of estimators and learning rates.</p>
        </sec>
        <sec>
          <title>Artificial Neural Network</title>
          <p>A backpropagation algorithm was used to train a neural network–based binary classifier. Generally, artificial neural networks (ANNs) perform well on survival data sets [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref35">35</xref>].</p>
        </sec>
        <sec>
          <title>Support Vector Machines</title>
          <p>Classification models using support vector machines (SVMs) have been applied to predict survival data [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. To train the SVM, we experimented with different kernels, that is, linear, radial, sigmoid, and polynomial kernels. The linear and sigmoid kernels provided the lowest prediction scores; therefore, we did not use them further. A polynomial kernel with degree 2 yielded suboptimal results, and the SVM model could not converge for degree 3. The radial basis kernel was the most effective for learning the classification model.</p>
        </sec>
      </sec>
      <sec>
        <title>Calculating Feature Importance Over Time</title>
        <p>The nonoverlapped time cohorts were used to calculate the feature importance scores to understand the changing relevance of features over time. We calculated these scores by training an RF classifier on the complete data set. The scores were calculated using Gini. Feature influence scores were used to understand the effect of features over the three cohorts.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overview</title>
        <p>Below, we present the prediction performance of the four ML classifiers using both overlapped and nonoverlapped cohorts. As LR has been extensively used to predict time-to-event in organ transplant studies [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref29">29</xref>], it is used as a comparator classifier to the ML-based classifiers. The prediction performance of each of the best-trained classifiers (SVM, RF, AdaBoost, ANN, and LR), covering the three different time-to-event periods for both the original and reduced feature sets, were evaluated using 10-fold stratified cross validation for both overlapped and nonoverlapped cohorts. The results of each classifier were examined using the area under the curve (AUC) and F1 scores. The AUC score was used as the main performance evaluation metric to select the best model in each cohort and to make comparisons with similar studies. For our purpose, the ideal prediction model provides the best accuracy for graft failure. Therefore, to further substantiate the selection of the best model, we also evaluated the F1 score for graft failures. In cases where the AUC score was the same for different models, preference was given to the model with the highest F1 score.</p>
      </sec>
      <sec>
        <title>Analysis of Feature Engineering</title>
        <p><xref ref-type="table" rid="table4">Table 4</xref> presents the results of feature engineering, whereby the prediction scores of all classifiers were obtained using both the original feature set and the reduced set. The reduced set consists of original continuous features and latent features returned by the stacked autoencoders. Cohort 1 for overlapped and nonoverlapped cohorts was the same; hence, the results were presented only once to avoid unnecessary duplication.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Area under the curve comparison—all features with auto-encoded features.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="350"/>
            <col width="0"/>
            <col width="150"/>
            <col width="0"/>
            <col width="160"/>
            <col width="0"/>
            <col width="150"/>
            <col width="0"/>
            <col width="160"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Cohort</td>
                <td colspan="4">Overlapped</td>
                <td colspan="3">Nonoverlapped</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">All features (%)</td>
                <td colspan="2">Continuous+auto-encoded features (%)</td>
                <td colspan="2">All features (%)</td>
                <td>Continuous+auto-encoded features (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="10">
                  <bold>Cohort 1</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>SVM<sup>a</sup></td>
                <td colspan="2">80</td>
                <td colspan="2">82</td>
                <td colspan="2">N/A<sup>b</sup></td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AdaBoost<sup>c</sup></td>
                <td colspan="2">76</td>
                <td colspan="2">78</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>RF<sup>d</sup></td>
                <td colspan="2">68</td>
                <td colspan="2">70</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>ANN<sup>e</sup></td>
                <td colspan="2">62</td>
                <td colspan="2">61</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LR<sup>f</sup></td>
                <td colspan="2">62</td>
                <td colspan="2">62</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>Cohort 2</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>SVM</td>
                <td colspan="2">63</td>
                <td colspan="2">66</td>
                <td colspan="2">53</td>
                <td colspan="2">53</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AdaBoost</td>
                <td colspan="2">67</td>
                <td colspan="2">69</td>
                <td colspan="2">64</td>
                <td colspan="2">60</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>RF</td>
                <td colspan="2">62</td>
                <td colspan="2">65</td>
                <td colspan="2">65</td>
                <td colspan="2">67</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>ANN</td>
                <td colspan="2">62</td>
                <td colspan="2">62</td>
                <td colspan="2">62</td>
                <td colspan="2">62</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LR</td>
                <td colspan="2">62</td>
                <td colspan="2">62</td>
                <td colspan="2">64</td>
                <td colspan="2">61</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>Cohort 3</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>SVM</td>
                <td colspan="2">73</td>
                <td colspan="2">80</td>
                <td colspan="2">68</td>
                <td colspan="2">65</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AdaBoost</td>
                <td colspan="2">76</td>
                <td colspan="2">81</td>
                <td colspan="2">68</td>
                <td colspan="2">64</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>RF</td>
                <td colspan="2">72</td>
                <td colspan="2">75</td>
                <td colspan="2">68</td>
                <td colspan="2">66</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>ANN</td>
                <td colspan="2">73</td>
                <td colspan="2">72</td>
                <td colspan="2">68</td>
                <td colspan="2">65</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LR</td>
                <td colspan="2">69</td>
                <td colspan="2">69</td>
                <td colspan="2">62</td>
                <td colspan="2">64</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>SVM: support vector machine.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>AdaBoost: adaptive boosting.</p>
            </fn>
            <fn id="table4fn4">
              <p><sup>d</sup>RF: random forest.</p>
            </fn>
            <fn id="table4fn5">
              <p><sup>e</sup>ANN: artificial neural network.</p>
            </fn>
            <fn id="table4fn6">
              <p><sup>f</sup>LR: logistic regression.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>The AUC scores (<xref ref-type="table" rid="table4">Table 4</xref>) show that prediction models for overlapped cohorts trained with auto-encoded features improved the prediction performance as compared with the prediction models trained using the original feature set. However, it was the opposite for nonoverlapped cohorts. Interestingly, the traditional approach of overlapped cohorts performed better with both the original and reduced feature sets compared with the nonoverlapped cohorts. Except for RF in cohort 2 of nonoverlapped cohorts, which showed slightly better performance (67%) when compared with its overlapped counterpart (65%), all other prediction models had better AUC scores with the traditional overlapping cohort approach. Therefore, for further analysis, we proceeded with overlapping cohorts only.</p>
        <p>Although ANN and LR (the baseline model) showed no significant improvement across all three cohorts, the results confirmed the effectiveness of our deep learning architecture of stacked autoencoders for feature selection. For the subsequent prediction modeling analysis, we used the reduced feature set.</p>
      </sec>
      <sec>
        <title>Analysis of Prediction Performance of ML Models</title>
        <p><xref ref-type="table" rid="table5">Table 5</xref> presents the prediction performance of the classifiers for each cohort in terms of AUC, F1 scores, recall, and precision, with SD for the 10-fold classification.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Prediction performance of the machine learning classifiers across three different temporal cohorts using the overlapped patient stratification<sup>a</sup>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="170"/>
            <col width="0"/>
            <col width="200"/>
            <col width="0"/>
            <col width="200"/>
            <col width="0"/>
            <col width="200"/>
            <col width="0"/>
            <col width="200"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Cohort</td>
                <td colspan="7"> Auto-encoded feature set</td>
              </tr>
              <tr valign="bottom">
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">AUC<sup>b</sup> (%), mean (SD)</td>
                <td colspan="2">F1 (%), mean (SD)</td>
                <td colspan="2">Recall (%), mean (SD)</td>
                <td>Precision (%), mean (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="10">
                  <bold>Cohort 1</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>SVM</italic>
                  <sup>c</sup>
                </td>
                <td colspan="2">
                  <italic>82 (0.01)</italic>
                </td>
                <td colspan="2">
                  <italic>61 (0.01)</italic>
                </td>
                <td colspan="2">
                  <italic>49 (0.01)</italic>
                </td>
                <td colspan="2">
                  <italic>90 (0.01)</italic>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AdaBoost<sup>d</sup></td>
                <td colspan="2">78 (0.01)</td>
                <td colspan="2">56 (0.01)</td>
                <td colspan="2">95 (0.01)</td>
                <td colspan="2">35 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>RF<sup>e</sup></td>
                <td colspan="2">70 (0.009)</td>
                <td colspan="2">45 (0.001)</td>
                <td colspan="2">47 (0.01)</td>
                <td colspan="2">41 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>ANN<sup>f</sup></td>
                <td colspan="2">61 (0.01)</td>
                <td colspan="2">5 (0.001)</td>
                <td colspan="2">42 (0.01)</td>
                <td colspan="2">6 (0.004)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LR<sup>g</sup></td>
                <td colspan="2">62 (0.008)</td>
                <td colspan="2">39 (0.009)</td>
                <td colspan="2">58 (0.01)</td>
                <td colspan="2">29 (0.04)</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>Cohort 2</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>SVM</td>
                <td colspan="2">66 (0.006)</td>
                <td colspan="2">53 (0.01)</td>
                <td colspan="2">55 (0.01)</td>
                <td colspan="2">60 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>AdaBoost</italic>
                </td>
                <td colspan="2">
                  <italic>69 (0.01)</italic>
                </td>
                <td colspan="2">
                  <italic>63 (0.01)</italic>
                </td>
                <td colspan="2">
                  <italic>64 (0.003)</italic>
                </td>
                <td colspan="2">
                  <italic>63 (0.004)</italic>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>RF</td>
                <td colspan="2">65 (0.009)</td>
                <td colspan="2">62 (0.01)</td>
                <td colspan="2">62 (0.01)</td>
                <td colspan="2">61 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>ANN</td>
                <td colspan="2">63 (0.007)</td>
                <td colspan="2">60 (0.04)</td>
                <td colspan="2">55 (0.09)</td>
                <td colspan="2">60 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LR</td>
                <td colspan="2">62 (0.008)</td>
                <td colspan="2">59 (0.009)</td>
                <td colspan="2">58 (0.01)</td>
                <td colspan="2">60 (0.004)</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>Cohort 3</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>SVM</td>
                <td colspan="2">80 (0.005)</td>
                <td colspan="2">83 (0.003)</td>
                <td colspan="2">76 (0.003)</td>
                <td colspan="2">96 (0.003)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>AdaBoost</italic>
                </td>
                <td colspan="2">
                  <italic>81 (0.01)</italic>
                </td>
                <td colspan="2">
                  <italic>81 (0.004)</italic>
                </td>
                <td colspan="2">
                  <italic>76 (0.003)</italic>
                </td>
                <td colspan="2">
                  <italic>86 (0.01)</italic>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>RF</td>
                <td colspan="2">75 (0.008)</td>
                <td colspan="2">75 (0.006)</td>
                <td colspan="2">75 (0.01)</td>
                <td colspan="2">73 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>ANN</td>
                <td colspan="2">72 (0.007)</td>
                <td colspan="2">68 (0.005)</td>
                <td colspan="2">81 (0.03)</td>
                <td colspan="2">69 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LR</td>
                <td colspan="2">69 (0.001)</td>
                <td colspan="2">77 (0.009)</td>
                <td colspan="2">70 (0.01)</td>
                <td colspan="2">70 (0.001)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>Italics show the classifiers with the highest performance among the three cohorts.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>AUC: area under the curve.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>SVM: support vector machine.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>AdaBoost: adaptive boosting.</p>
            </fn>
            <fn id="table5fn5">
              <p><sup>e</sup>RF: random forest.</p>
            </fn>
            <fn id="table5fn6">
              <p><sup>f</sup>ANN: artificial neural network.</p>
            </fn>
            <fn id="table5fn7">
              <p><sup>g</sup>LR: logistic regression.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>The classifiers performed differently across the three cohorts—SVM offered the highest prediction performance for short-term predictions, that is, for cohort 1, whereas AdaBoost offered the highest performance for the remaining cohorts. The SD across the different folds was nominal, confirming the stability of the classifiers. <xref rid="figure4" ref-type="fig">Figure 4</xref> shows the receiver operating characteristic curves for the best models from each cohort.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Receiver operating characteristic curves for support vector machine, adaptive boosting, and adaptive boosting for the three cohorts, respectively (left to right). AUC: area under the curve; ROC: receiver operating characteristic.</p>
          </caption>
          <graphic xlink:href="jmir_v23i8e26843_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>To further investigate the prediction efficacy of the ML-based classifiers, we evaluated the prediction performance of the best-performing classifier for all three cohorts by testing the prediction of graft failure events by a classifier trained for a specific cohort with data from other cohorts, that is, testing the classifier for cohort 2 with randomly selected data from cohorts 1 and 3. The underlying assumption is that the classifier should not produce good prediction results for data from other cohorts. As this evaluation considers survivors across progressive cohorts, we used the F1 score to measure prediction performance. A sound prediction model for cohort 2 will give a high graft failure prediction score for data from cohort 1 but a low prediction score for data from cohort 3, the rationale being that the overlapping cohort 2 classifier is trained on graft failure cases in both cohorts 1 and 2<italic>.</italic> Therefore, the prediction model for cohort 2 should give a high prediction score for predicting graft failures from year<sub>0</sub> to year<sub>5</sub>, but when applied to cohort 3<italic>,</italic> the cohort 2 prediction model would be unable to predict graft failure as it has not been trained on cohort 3 data. <xref ref-type="table" rid="table6">Table 6</xref> provides the cross-cohort prediction scores for the best classifiers for each cohort.</p>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Prediction performance (F1 scores) for cross-cohort predictions using overlapped cohorts.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="400"/>
            <col width="200"/>
            <col width="200"/>
            <col width="200"/>
            <thead>
              <tr valign="top">
                <td>Model</td>
                <td>Cohort 1</td>
                <td>Cohort 2</td>
                <td>Cohort 3</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>SVM<sup>a</sup> (cohort 1)</td>
                <td>0.6</td>
                <td>0.42</td>
                <td>0.29</td>
              </tr>
              <tr valign="top">
                <td>AdaBoost<sup>b</sup> (cohort 2)</td>
                <td>0.79</td>
                <td>0.87</td>
                <td>0.58</td>
              </tr>
              <tr valign="top">
                <td>AdaBoost (cohort 3)</td>
                <td>0.72</td>
                <td>0.75</td>
                <td>0.87</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>SVM: support vector machine.</p>
            </fn>
            <fn id="table6fn2">
              <p><sup>b</sup>AdaBoost: adaptive boosting.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Results of Wilcoxon Signed-Rank Test</title>
        <p>To determine if the prediction differences between the different models were statistically significant, we used the Wilcoxon signed-rank test to compare the scores between different models. Because the best scores in each cohort were usually produced by SVM and AdaBoost models, the Wilcoxon signed-rank test was conducted with each combination of these models with the other models.</p>
        <p><xref ref-type="table" rid="table7">Table 7</xref> shows the results based on the F1 score, and the <italic>P</italic> values between the models were quite small and less than the threshold value of <italic>P</italic>=.05, confirming that the performance difference is statistically significant.</p>
        <table-wrap position="float" id="table7">
          <label>Table 7</label>
          <caption>
            <p>The results for Wilcoxon signed-rank test (F1).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="250"/>
            <col width="150"/>
            <col width="150"/>
            <col width="150"/>
            <col width="150"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td>Cohort</td>
                <td colspan="5"><italic>P</italic> value (F1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>SVM<sup>a</sup>-AdaBoost<sup>b,c</sup></td>
                <td>SVM-ANN<sup>d,e</sup></td>
                <td>SVM-RF<sup>f,g</sup></td>
                <td>AdaBoost-RF<sup>h</sup></td>
                <td>AdaBoost-ANN<sup>i</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Cohort 1</td>
                <td>.003</td>
                <td>.003</td>
                <td>.003</td>
                <td>.003</td>
                <td>.003</td>
              </tr>
              <tr valign="top">
                <td>Cohort 2</td>
                <td>.003</td>
                <td>.003</td>
                <td>.003</td>
                <td>.003</td>
                <td>.03</td>
              </tr>
              <tr valign="top">
                <td>Cohort 3</td>
                <td>&#60;.001</td>
                <td>&#60;.001</td>
                <td>&#60;.001</td>
                <td>&#60;.001</td>
                <td>&#60;.001</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table7fn1">
              <p><sup>a</sup>SVM: support vector machine.</p>
            </fn>
            <fn id="table7fn2">
              <p><sup>b</sup>AdaBoost: adaptive boosting.</p>
            </fn>
            <fn id="table7fn3">
              <p><sup>c</sup>H<sub>o</sub> (null hypothesis): SVM=AdaBoost; H<sub>a</sub> (alternative hypothesis): SVM≠AdaBoost.</p>
            </fn>
            <fn id="table7fn4">
              <p><sup>d</sup>ANN: artificial neural network.</p>
            </fn>
            <fn id="table7fn5">
              <p><sup>e</sup>H<sub>o</sub>: SVM=EANN; H<sub>a</sub>: SVM≠EANN.</p>
            </fn>
            <fn id="table7fn6">
              <p><sup>f</sup>RF: random forest.</p>
            </fn>
            <fn id="table7fn7">
              <p><sup>g</sup>H<sub>o</sub>: SVM=RF; H<sub>a</sub>: SVM≠RF.</p>
            </fn>
            <fn id="table7fn8">
              <p><sup>h</sup>H<sub>o</sub>: AdaBoost=RF; H<sub>a</sub>: AdaBoost≠RF.</p>
            </fn>
            <fn id="table7fn9">
              <p><sup>i</sup>H<sub>o</sub>: AdaBoost=ANN; H<sub>a</sub>: AdaBoost≠ANN.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Analysis of the Influence of Clinical Features Over Time Toward Graft Status Prediction</title>
        <sec>
          <title>Overview</title>
          <p>The second objective of this research is to analyze the influence of clinical features on the prediction of graft survival over different periods. The intent was to understand the factors responsible for graft survival at different periods after transplant. The nonoverlapped cohorts (0-1 years, &#62;1-5 years, and &#62;5-17 years following a transplant) were used to ensure that there was no cascading influence of the features over time. For comparison purposes, we also examined the feature importance for overlapping cohorts. The feature importance scores represent the relative importance of the feature among all features, that is, the total of all the features’ importance scores add up to 100%; hence, if one feature gains a higher importance score, it will be at the expense of the importance score of other features.</p>
          <p><xref rid="figure5" ref-type="fig">Figures 5</xref> and <xref rid="figure6" ref-type="fig">6</xref> illustrate the individual feature importance scores across all the nonoverlapped and overlapped cohorts, respectively.</p>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>Changing relevance of features based on nonoverlapped time cohorts.</p>
            </caption>
            <graphic xlink:href="jmir_v23i8e26843_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure6" position="float">
            <label>Figure 6</label>
            <caption>
              <p>Changing relevance of features based on overlapped time cohorts.</p>
            </caption>
            <graphic xlink:href="jmir_v23i8e26843_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <p>In general, the top 10% of the important features remained consistent in both the nonoverlapped and overlapped cohorts; however, we note that the nonoverlapped cohorts identified a larger group of important features. For instance, peak panel reactive antibody (Pkpra) and pre-emptive recipient status (Preemptive) had negligible importance in overlapping cohorts but were important during the 2-5 years and 6-17 years in the nonoverlapping cohorts. <xref ref-type="table" rid="table8">Table 8</xref> shows the feature importance across the three cohorts.</p>
          <table-wrap position="float" id="table8">
            <label>Table 8</label>
            <caption>
              <p>Ranking of the top-10 features across the time cohorts with feature importance scores<sup>a</sup>.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="70"/>
              <col width="200"/>
              <col width="190"/>
              <col width="190"/>
              <col width="180"/>
              <col width="170"/>
              <thead>
                <tr valign="top">
                  <td>Rank</td>
                  <td>Cohort 1, feature, relative score (%)</td>
                  <td colspan="2">Cohort 2</td>
                  <td colspan="2">Cohort 3</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Feature, relative score (%)</td>
                  <td>Importance (%), rank change</td>
                  <td>Feature, relative score (%)</td>
                  <td>Importance (%), rank change</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>1</td>
                  <td>HLAMM<sup>b</sup> (13)</td>
                  <td>ESRDDXSIMP<sup>c</sup> (18)</td>
                  <td>
                    <italic>+100, +2</italic>
                  </td>
                  <td>RAGETX<sup>d</sup> (16)</td>
                  <td>+77, <italic>+3</italic></td>
                </tr>
                <tr valign="top">
                  <td>2</td>
                  <td>VINTAGE<sup>e</sup> (12)</td>
                  <td>VINTAGE (11)</td>
                  <td>–8, <italic>0</italic></td>
                  <td>RDM2<sup>f</sup> (16)</td>
                  <td>&#62;+100, <italic>&#62;+10</italic></td>
                </tr>
                <tr valign="top">
                  <td>3</td>
                  <td>ESRDDXSIMP (9)</td>
                  <td>HLAMM (10)</td>
                  <td>–23, –<italic>2</italic></td>
                  <td>ESRDDXSIMP (13)</td>
                  <td>–27, –<italic>2</italic></td>
                </tr>
                <tr valign="top">
                  <td>4</td>
                  <td>DRCMV<sup>g</sup> (8)</td>
                  <td>RAGETX (9)</td>
                  <td>+78, <italic>+6</italic></td>
                  <td>FUNCTSTAT<sup>h</sup> (12)</td>
                  <td>&#62;+100, <italic>+3</italic></td>
                </tr>
                <tr valign="top">
                  <td>5</td>
                  <td>DRRACE<sup>i</sup> (8)</td>
                  <td>DAGE<sup>j</sup> (6)</td>
                  <td>50, <italic>+2</italic></td>
                  <td>DAGE (5)</td>
                  <td>–16, <italic>0</italic></td>
                </tr>
                <tr valign="top">
                  <td>6</td>
                  <td>FUNCTSTAT (7)</td>
                  <td>DRRACE (4)</td>
                  <td>–100, –<italic>1</italic></td>
                  <td>DRRACE (3)</td>
                  <td>–25, <italic>0</italic></td>
                </tr>
                <tr valign="top">
                  <td>7</td>
                  <td>DAGE (4)</td>
                  <td>FUNCTSTAT (4)</td>
                  <td>–75, –<italic>1</italic></td>
                  <td>ECD<sup>k</sup> (3)</td>
                  <td>&#62;+100, <italic>&#62;+3</italic></td>
                </tr>
                <tr valign="top">
                  <td>8</td>
                  <td>RCAD<sup>l</sup> (4)</td>
                  <td>PKPRA<sup>m</sup> (3)</td>
                  <td>+50, <italic>&#62;+3</italic></td>
                  <td>VINTAGE (2)</td>
                  <td>&#62;–100, –<italic>6</italic></td>
                </tr>
                <tr valign="top">
                  <td>9</td>
                  <td>RDM2 (3)</td>
                  <td>PREEMPTIVE<sup>n</sup> (3)</td>
                  <td>+50, <italic>&#62;+1</italic></td>
                  <td>PREEMPTIVE (2)</td>
                  <td>–33, <italic>0</italic></td>
                </tr>
                <tr valign="top">
                  <td>10</td>
                  <td>RAGETX (2)</td>
                  <td>DRCMV (2)</td>
                  <td>–75, –<italic>6</italic></td>
                  <td>RWT2 (2)</td>
                  <td>0, <italic>0</italic></td>
                </tr>
                <tr valign="top">
                  <td>Rest</td>
                  <td>Rest (31)</td>
                  <td>Rest (30)</td>
                  <td>Rest (30)</td>
                  <td>Rest (26)</td>
                  <td>Rest (26)</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table8fn1">
                <p><sup>a</sup>Importance (%) and rank change is shown in italics.</p>
              </fn>
              <fn id="table8fn2">
                <p><sup>b</sup>HLAMM: HLA antigen mismatch.</p>
              </fn>
              <fn id="table8fn3">
                <p><sup>c</sup>ESRDDXSIMP: simplified end-stage renal disease diagnosis.</p>
              </fn>
              <fn id="table8fn4">
                <p><sup>d</sup>RAGETX: recipient age.</p>
              </fn>
              <fn id="table8fn5">
                <p><sup>e</sup>VINTAGE: number of years on dialysis before transplant.</p>
              </fn>
              <fn id="table8fn6">
                <p><sup>f</sup>RDM2: recipient diabetes status.</p>
              </fn>
              <fn id="table8fn7">
                <p><sup>g</sup>DRCMV: donor-recipient cytomegalovirus.</p>
              </fn>
              <fn id="table8fn8">
                <p><sup>h</sup>FUNCTSTAT: functional status of the recipient.</p>
              </fn>
              <fn id="table8fn9">
                <p><sup>i</sup>DRRACE: donor-recipient race.</p>
              </fn>
              <fn id="table8fn10">
                <p><sup>j</sup>DAGE: donor age.</p>
              </fn>
              <fn id="table8fn11">
                <p><sup>k</sup>ECD: expanded criteria donor.</p>
              </fn>
              <fn id="table8fn12">
                <p><sup>l</sup>RCAD: recipient coronary artery disease.</p>
              </fn>
              <fn id="table8fn13">
                <p><sup>m</sup>PKPRA: peak panel reactive antibody.</p>
              </fn>
              <fn id="table8fn14">
                <p><sup>n</sup>PREEMPTIVE: pre-emptive transplant.</p>
              </fn>
              <fn id="table8fn15">
                <p><sup>o</sup>RWT2: recipient weight.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <p>Below, we analyze the importance of features in each cohort and show the influence of features over time using nonoverlapping cohorts.</p>
        </sec>
        <sec>
          <title>Feature Importance for Cohort 1</title>
          <p>According to the top features shown in <xref ref-type="table" rid="table8">Table 8</xref>, HLAMMs and the number of years on dialysis before transplant (VINTAGE) were the most important features with a relative importance of over 10%. This observation has been confirmed in other studies [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. Donor-recipient CMV status, donor-recipient race, end-stage renal disease diagnosis (ESRDDXSIMP), and functional status of the recipient were ranked as having medium importance with a relative score between 5% and 10%. Donor-recipient race pairs and donor-recipient CMV pairs were noted to have more predictive influence in cohort 1 than in the other two cohorts.</p>
        </sec>
        <sec>
          <title>Feature Importance for Cohort 2</title>
          <p>Both HLAMMs and VINTAGE remained highly important in cohort 2. In addition, ESRDDXSIMP was noted as a highly important feature. Interestingly, we note that few features, such as donor age and recipient age, were rather insignificant in cohort 1 but were noted to be significant in both cohort 2 and further in cohort 3.</p>
        </sec>
        <sec>
          <title>Feature Importance for Cohort 3</title>
          <p>ESRDDXSIMP showed a relative downward trend; however, it remained a highly significant feature. Unlike earlier cohorts, HLAMMs and VINTAGE were noted to not maintain their importance in the long term, whereas the recipient’s status of diabetes was noted to be the most important feature, along with recipient age and their functional status. Donor age was noted to maintain a medium importance score between 5% and 10%.</p>
          <p><xref rid="figure7" ref-type="fig">Figure 7</xref> presents a heat map of the importance score to illustrate the changing influence of the top 25 features across the three cohorts. In addition to the top 10 features (<xref ref-type="table" rid="table8">Table 8</xref>), the heat map details the contribution of relatively less important features. It was interesting to see that few features (such as donor weight, recipient weight, and donor hypertension) had static importance across the three cohorts. This indicates that although these features were not deterministic for the cohorts, they possessed a certain value for the prediction models.</p>
          <fig id="figure7" position="float">
            <label>Figure 7</label>
            <caption>
              <p>Changing relevance of top 25 features over the three cohorts. AHD1: donor-recipient height difference; CIT: cold ischemia time; DAGE: donor age; DHT100: donor height; DHTN2: donor hypertension; DONCREAT: donor creatinine level; DRACESIMP: donor race; DRCMV: donor-recipient cytomegalovirus; DRRACE: donor-recipient race; DRWT: donor-recipient weight difference; DWT: donor weight; ECD: expanded criteria donor; ESRDDXSIMP: simplified end-stage renal disease diagnosis; FUNCTSTAT: functional status of the recipient; HLAMM: number of HLA mismatches; PKPRA: peak panel reactive antibody; PREEMPTIVE: preemptive transplant; RAGETX: recipient age; RCAD: recipient coronary artery disease; RDM2: recipient diabetes; RHT2100: recipient height; RHTN: recipient hypertension; RRACESIMP: recipient race; RWT2: recipient weight; VINTAGE: number of years on dialysis before transplantation.</p>
            </caption>
            <graphic xlink:href="jmir_v23i8e26843_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <p>Analysis of the values of categorical features provided novel insights into the influence of a feature. <xref rid="figure8" ref-type="fig">Figure 8</xref> presents a heat map of the importance of the value of the categorical features generated after transforming them into dummy features.</p>
          <fig id="figure8" position="float">
            <label>Figure 8</label>
            <caption>
              <p>Changing relevance of top 25 features (including dummy features) over the three cohorts. CIT: cold ischemia time; DAGE: donor age; DBMI: donor BMI; DHT100: donor height; DONCREAT: donor creatinine level; DRCMV_2: Donor positive recipient positive; DRRACE_1: Donor white recipient white; DWT: donor weight; ECD_0: Expanded criteria donor: no; ECD_1: Expanded criteria donor: yes; ESRDDXSIMP_2: End stage renal disease: diabetes mellitus; ESRDDXSIMP_3: End stage renal disease: polycystic kidney disease; ESRDDXSIMP_4: End stage renal disease: hypertension; FUNCTSTAT_1: Functional status of recipient: 100% no complaints; HLAMM _5: Number of human leukocyte antigen mismatches: 5; PKPRA: peak panel reactive antibody; PREEMPTIVE_1: Preemptive transplant: yes; PREEMPTIVE_2: Preemptive transplant: no; RAGETX: recipient age; RBMI2: recipient BMI; RDM2_0: Recipient diabetes: no; RDM2_1: Recipient diabetes: yes; RHT2100: recipient height; RWT2: recipient weight; VINTAGE: number of years on dialysis before transplantation.</p>
            </caption>
            <graphic xlink:href="jmir_v23i8e26843_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The cross-cohort prediction results (<xref ref-type="table" rid="table6">Table 6</xref>) confirm the efficacy of the classifiers—the prediction model for cohort 3 (ie, AdaBoost) correctly offers a high prediction score for data from cohort 1 (72%) and cohort 2 (75%). The prediction model for cohort 2 offers a high prediction score for cohort 1 data (79%) but a low prediction score for cohort 3 (58%) data. The classifier for cohort 1 (ie, SVM) gave low prediction scores for data from cohort 2 (42%) and cohort 3 (29%). Interestingly, the highest prediction score by a cohort-specific classifier was always achieved for data from its respective cohort. The prediction modeling results confirmed that the prediction models were highly sensitive to their respective cohorts.</p>
      </sec>
      <sec>
        <title>Comparing Prediction Performance With Prior Studies</title>
        <p>We compared the prediction performance of our ML-based prediction models with comparable organ transplant studies that involved similar-sized observations and temporal windows. <xref ref-type="table" rid="table9">Table 9</xref> summarizes the findings of the two studies for each cohort. There have been several other studies [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>] to predict the short-term graft status of different organ transplants, but because of their small data set, these do not serve as a meaningful comparison.</p>
        <table-wrap position="float" id="table9">
          <label>Table 9</label>
          <caption>
            <p>Prediction scores of similar studies.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="100"/>
            <col width="180"/>
            <col width="150"/>
            <col width="90"/>
            <col width="100"/>
            <col width="100"/>
            <col width="130"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td>Time</td>
                <td>Study</td>
                <td>Model</td>
                <td>Size</td>
                <td>Data set</td>
                <td>Metric</td>
                <td>Score (%)</td>
                <td>Our score (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1 year</td>
                <td>Lin et al [<xref ref-type="bibr" rid="ref16">16</xref>]</td>
                <td>ANN<sup>a</sup> and LR<sup>b</sup></td>
                <td>46,414</td>
                <td>UNOS<sup>c</sup></td>
                <td>AUC<sup>d</sup></td>
                <td>73</td>
                <td>82</td>
              </tr>
              <tr valign="top">
                <td>1 year</td>
                <td>Dag et al [<xref ref-type="bibr" rid="ref23">23</xref>]</td>
                <td>LR</td>
                <td>15,580</td>
                <td>UNOS</td>
                <td>AUC</td>
                <td>63</td>
                <td>82</td>
              </tr>
              <tr valign="top">
                <td>5 years</td>
                <td>Tiong et al [<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                <td>Nomogram</td>
                <td>20,085</td>
                <td>UNOS</td>
                <td>C-index<sup>e</sup></td>
                <td>71</td>
                <td>69</td>
              </tr>
              <tr valign="top">
                <td>5 years</td>
                <td>Lin et al [<xref ref-type="bibr" rid="ref16">16</xref>]</td>
                <td>ANN</td>
                <td>17,856</td>
                <td>UNOS</td>
                <td>AUC</td>
                <td>77</td>
                <td>69</td>
              </tr>
              <tr valign="top">
                <td>7 years</td>
                <td>Lin et al [<xref ref-type="bibr" rid="ref16">16</xref>]</td>
                <td>ANN</td>
                <td>10,250</td>
                <td>UNOS</td>
                <td>AUC</td>
                <td>82</td>
                <td>81</td>
              </tr>
              <tr valign="top">
                <td>14 years</td>
                <td>Luck et al [<xref ref-type="bibr" rid="ref40">40</xref>]</td>
                <td>ANN</td>
                <td>46,098</td>
                <td>SRTR<sup>f</sup></td>
                <td>C-index</td>
                <td>65</td>
                <td>81</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table9fn1">
              <p><sup>a</sup>ANN: artificial neural network.</p>
            </fn>
            <fn id="table9fn2">
              <p><sup>b</sup>LR: logistic regression.</p>
            </fn>
            <fn id="table9fn3">
              <p><sup>c</sup>UNOS: United Network of Organ Sharing.</p>
            </fn>
            <fn id="table9fn4">
              <p><sup>d</sup>AUC: area under the curve.</p>
            </fn>
            <fn id="table9fn5">
              <p><sup>e</sup>C-index: concordance index.</p>
            </fn>
            <fn id="table9fn6">
              <p><sup>f</sup>SRTR: Scientific Registry of Transplant Recipients.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>When comparing our results with prior studies, it is noted that although our cohort 2 prediction performance (ie, graft status prediction over a 5-year period) is lower than that of Lin et al [<xref ref-type="bibr" rid="ref16">16</xref>], it was based on a much smaller data set that included 10,641 survivals and 7215 failures, whereas we analyzed 23,475 failures and 29,352 survivals. Similarly, Tiong et al [<xref ref-type="bibr" rid="ref39">39</xref>] analyzed a smaller sample of 20,085 living donor transplant recipients to achieve a concordance index of 71%. Our cohort 3 prediction performance is marginally lower compared with Lin et al [<xref ref-type="bibr" rid="ref16">16</xref>], who predicted a 7-year graft survival with an 82% AUC score, whereas our cohort 3 prediction model covers a much longer (17 years) temporal window and achieves a comparable prediction score. Using a similar number of transplants, Luck et al [<xref ref-type="bibr" rid="ref40">40</xref>] achieved a much lower concordance index between 63% and 66% for 14-years graft survival.</p>
      </sec>
      <sec>
        <title>Limitations and Future Work</title>
        <p>A limitation of our research lies in the removal of censored instances. We removed all successful cases that were censored before 8 years following transplant. Although this type of approach has previously been used, including censored cases is a potential consideration for future analyses.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Understanding the impact of donor and recipient factors that predict short- and long-term kidney transplant allograft survival is important for patients and providers. Kidney transplantation is the optimal form of kidney replacement therapy, but kidney allografts are a limited resource. In addition, the alternative to kidney transplantation (ie, dialysis) is considerably costlier.</p>
        <p>In this study, we present an ML-based framework to predict the status of kidney allografts, based on donor-recipient features, over a period of 17 years. We applied ML-based data analysis methods for feature engineering to reduce data dimensionality, develop prediction models for three distinct temporal cohorts, and investigate the changing relevance of clinical features across different temporal cohorts. We introduced the concept of nonoverlapped cohorts to analyze the changing relevance of features in three defined periods. In conclusion, our results emphasize that ML can be effective in predicting graft survival using donor and recipient factors that are routinely collected as part of patient care. As a next step, we plan to incorporate the prediction models into clinical care at the time of allocation; models that best predict short- and long-term kidney graft survival may be used as a pragmatic prognostic tool to aid clinicians in maximizing the best possible matching of donors and recipients while preserving existing allocation rules that are used to promote equity [<xref ref-type="bibr" rid="ref41">41</xref>].</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Supplementary tables.</p>
        <media xlink:href="jmir_v23i8e26843_app1.doc" xlink:title="DOC File , 24 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AdaBoost</term>
          <def>
            <p>adaptive boosting</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ANN</term>
          <def>
            <p>artificial neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">AUC</term>
          <def>
            <p>area under the curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">CMV</term>
          <def>
            <p>cytomegalovirus</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">ESRDDXSIMP</term>
          <def>
            <p>end-stage renal disease diagnosis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">LR</term>
          <def>
            <p>logistic regression</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">RF</term>
          <def>
            <p>random forest</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">SMOTE</term>
          <def>
            <p>Synthetic Minority Oversampling Technique</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">SRTR</term>
          <def>
            <p>Scientific Registry of Transplant Recipients</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">SVM</term>
          <def>
            <p>support vector machine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">VINTAGE</term>
          <def>
            <p>number of years on dialysis before transplant</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The data reported here have been supplied by the Hennepin Healthcare Research Institute as the contractor for the SRTR. The interpretation and reporting of these data are the responsibility of the authors and in no way should be seen as an official policy of or interpretation by the SRTR or the US Government.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>SAAN and SSRA were responsible for the overall data analysis methodology, data analysis using ML algorithms, evaluation of the data analysis results, and writing of the manuscript. KT and AV provided clinical expertise in defining the problem, interpretation of the data, preprocessing of the data and interpretation of the results, providing the data from the data source, and editing the manuscript for clinical clarity and purpose. PCR facilitated the setting up and conducting of data analysis experiments. All authors critically reviewed the manuscript for scientific content and approved the final manuscript for publication.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>CE</given-names>
            </name>
          </person-group>
          <article-title>Kidney Transplantation</article-title>
          <source>Transplantation</source>
          <year>1968</year>
          <volume>6</volume>
          <issue>5</issue>
          <fpage>753</fpage>
          <pub-id pub-id-type="doi">10.1097/00007890-196808000-00031</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>Yoshio N</given-names>
            </name>
            <name name-style="western">
              <surname>Chertow</surname>
              <given-names>Glenn M</given-names>
            </name>
          </person-group>
          <article-title>End stage renal disease</article-title>
          <source>BMJ Clin Evid</source>
          <year>2007</year>
          <month>10</month>
          <day>17</day>
          <volume>2007</volume>
          <fpage>1048</fpage>
          <lpage>59</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/19450356"/>
          </comment>
          <pub-id pub-id-type="medline">19450356</pub-id>
          <pub-id pub-id-type="pii">2002</pub-id>
          <pub-id pub-id-type="pmcid">PMC2943808</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Go</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Chertow</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>McCulloch</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Chronic Kidney Disease and the Risks of Death, Cardiovascular Events, and Hospitalization</article-title>
          <source>N Engl J Med</source>
          <year>2004</year>
          <month>09</month>
          <day>23</day>
          <volume>351</volume>
          <issue>13</issue>
          <fpage>1296</fpage>
          <lpage>1305</lpage>
          <pub-id pub-id-type="doi">10.1056/nejmoa041031</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rashidi Khazaee</surname>
              <given-names>Parviz</given-names>
            </name>
            <name name-style="western">
              <surname>Bagherzadeh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Niazkhani</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Pirnejad</surname>
              <given-names>Habibollah</given-names>
            </name>
          </person-group>
          <article-title>A dynamic model for predicting graft function in kidney recipients' upcoming follow up visits: A clinical application of artificial neural network</article-title>
          <source>Int J Med Inform</source>
          <year>2018</year>
          <month>11</month>
          <volume>119</volume>
          <fpage>125</fpage>
          <lpage>133</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.ijmedinf.2018.09.012"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2018.09.012</pub-id>
          <pub-id pub-id-type="medline">30342680</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(18)30111-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schold</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Segev</surname>
              <given-names>Dorry L</given-names>
            </name>
          </person-group>
          <article-title>Increasing the pool of deceased donor organs for kidney transplantation</article-title>
          <source>Nat Rev Nephrol</source>
          <year>2012</year>
          <month>03</month>
          <day>27</day>
          <volume>8</volume>
          <issue>6</issue>
          <fpage>325</fpage>
          <lpage>31</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/nrneph.2012.60"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/nrneph.2012.60</pub-id>
          <pub-id pub-id-type="medline">22450438</pub-id>
          <pub-id pub-id-type="pii">nrneph.2012.60</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="web">
          <source>Conservative Care - The Kidney Foundation of Canada &#124; La Fondation canadienne du rein</source>
          <access-date>2019-11-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.kidney.ca/conservative-care">https://www.kidney.ca/conservative-care</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <source>About Chronic Kidney Disease &#124; National Kidney Foundation</source>
          <access-date>2019-11-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.kidney.org/atoz/content/about-chronic-kidney-disease">https://www.kidney.org/atoz/content/about-chronic-kidney-disease</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Perl</surname>
              <given-names>Jeffrey</given-names>
            </name>
          </person-group>
          <article-title>Kidney transplant failure: failing kidneys, failing care?</article-title>
          <source>Clin J Am Soc Nephrol</source>
          <year>2014</year>
          <month>07</month>
          <volume>9</volume>
          <issue>7</issue>
          <fpage>1153</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cjasn.asnjournals.org/cgi/pmidlookup?view=long&#38;pmid=24903388"/>
          </comment>
          <pub-id pub-id-type="doi">10.2215/CJN.04670514</pub-id>
          <pub-id pub-id-type="medline">24903388</pub-id>
          <pub-id pub-id-type="pii">CJN.04670514</pub-id>
          <pub-id pub-id-type="pmcid">PMC4078952</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vinson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kiberd</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tennankore</surname>
              <given-names>Kk</given-names>
            </name>
          </person-group>
          <article-title>Nonimmunologic Donor-Recipient Pairing, HLA Matching, and Graft Loss in Deceased Donor Kidney Transplantation</article-title>
          <source>Transplantation Direct</source>
          <year>2019</year>
          <month>1</month>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>e414</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1097/TXD.0000000000000856"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/txd.0000000000000856</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Schaubel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Guidinger</surname>
              <given-names>Mary K</given-names>
            </name>
            <name name-style="western">
              <surname>Andreoni</surname>
              <given-names>Kenneth A</given-names>
            </name>
            <name name-style="western">
              <surname>Wolfe</surname>
              <given-names>Robert A</given-names>
            </name>
            <name name-style="western">
              <surname>Merion</surname>
              <given-names>Robert M</given-names>
            </name>
            <name name-style="western">
              <surname>Port</surname>
              <given-names>Friedrich K</given-names>
            </name>
            <name name-style="western">
              <surname>Sung</surname>
              <given-names>Randall S</given-names>
            </name>
          </person-group>
          <article-title>A comprehensive risk quantification score for deceased donor kidneys: the kidney donor risk index</article-title>
          <source>Transplantation</source>
          <year>2009</year>
          <month>07</month>
          <day>27</day>
          <volume>88</volume>
          <issue>2</issue>
          <fpage>231</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1097/TP.0b013e3181ac620b</pub-id>
          <pub-id pub-id-type="medline">19623019</pub-id>
          <pub-id pub-id-type="pii">00007890-200907270-00013</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Young</surname>
              <given-names>Ann</given-names>
            </name>
            <name name-style="western">
              <surname>Knoll</surname>
              <given-names>Greg A</given-names>
            </name>
            <name name-style="western">
              <surname>McArthur</surname>
              <given-names>Eric</given-names>
            </name>
            <name name-style="western">
              <surname>Dixon</surname>
              <given-names>Stephanie N</given-names>
            </name>
            <name name-style="western">
              <surname>Garg</surname>
              <given-names>Amit X</given-names>
            </name>
            <name name-style="western">
              <surname>Lok</surname>
              <given-names>Charmaine E</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>Ngan N</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S Joseph</given-names>
            </name>
          </person-group>
          <article-title>Is the Kidney Donor Risk Index a Useful Tool in Non-US Patients?</article-title>
          <source>Can J Kidney Health Dis</source>
          <year>2018</year>
          <volume>5</volume>
          <fpage>2054358118791148</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/2054358118791148?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub%3dpubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/2054358118791148</pub-id>
          <pub-id pub-id-type="medline">30083367</pub-id>
          <pub-id pub-id-type="pii">10.1177_2054358118791148</pub-id>
          <pub-id pub-id-type="pmcid">PMC6073818</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Senanayake</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Graves</surname>
              <given-names>Nicholas</given-names>
            </name>
            <name name-style="western">
              <surname>Healy</surname>
              <given-names>Helen</given-names>
            </name>
            <name name-style="western">
              <surname>Baboolal</surname>
              <given-names>Keshwar</given-names>
            </name>
            <name name-style="western">
              <surname>Kularatna</surname>
              <given-names>Sanjeewa</given-names>
            </name>
          </person-group>
          <article-title>Machine learning in predicting graft failure following kidney transplantation: A systematic review of published predictive models</article-title>
          <source>Int J Med Inform</source>
          <year>2019</year>
          <month>10</month>
          <volume>130</volume>
          <fpage>103957</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.ijmedinf.2019.103957"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2019.103957</pub-id>
          <pub-id pub-id-type="medline">31472443</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(19)30297-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Behara</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Agrawal</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Predictive modeling for organ transplantation outcomes</article-title>
          <year>2014</year>
          <month>11</month>
          <day>10</day>
          <conf-name>Proc - IEEE 14th Int Conf Bioinforma Bioeng BIBE  405?408</conf-name>
          <conf-date>2014</conf-date>
          <conf-loc>Boca Raton, FL, USA</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ieeexplore.ieee.org/document/7033613/"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/BIBE.2014.58</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Elster</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Stevens</surname>
              <given-names>Kristin</given-names>
            </name>
            <name name-style="western">
              <surname>Graybill</surname>
              <given-names>J Christopher</given-names>
            </name>
            <name name-style="western">
              <surname>Gillern</surname>
              <given-names>Suzanne</given-names>
            </name>
            <name name-style="western">
              <surname>Phinney</surname>
              <given-names>Samuel</given-names>
            </name>
            <name name-style="western">
              <surname>Salifu</surname>
              <given-names>Moro O</given-names>
            </name>
            <name name-style="western">
              <surname>Jindal</surname>
              <given-names>Rahul M</given-names>
            </name>
          </person-group>
          <article-title>Bayesian modeling of pretransplant variables accurately predicts kidney graft survival</article-title>
          <source>Am J Nephrol</source>
          <year>2012</year>
          <volume>36</volume>
          <issue>6</issue>
          <fpage>561</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.karger.com?DOI=10.1159/000345552"/>
          </comment>
          <pub-id pub-id-type="doi">10.1159/000345552</pub-id>
          <pub-id pub-id-type="medline">23221105</pub-id>
          <pub-id pub-id-type="pii">000345552</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Topuz</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zengul</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Dag</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Almehmi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yildirim</surname>
              <given-names>Mb</given-names>
            </name>
          </person-group>
          <article-title>Predicting graft survival among kidney transplant recipients: A Bayesian decision support model</article-title>
          <source>Decision Support Systems</source>
          <year>2018</year>
          <month>02</month>
          <volume>106</volume>
          <fpage>97</fpage>
          <lpage>109</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.dss.2017.12.004"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.dss.2017.12.004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Horn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hurdle</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Goldfarb-Rumyantzev</surname>
              <given-names>Alexander S</given-names>
            </name>
          </person-group>
          <article-title>Single and multiple time-point prediction models in kidney transplant outcomes</article-title>
          <source>J Biomed Inform</source>
          <year>2008</year>
          <month>12</month>
          <volume>41</volume>
          <issue>6</issue>
          <fpage>944</fpage>
          <lpage>52</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(08)00043-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2008.03.005</pub-id>
          <pub-id pub-id-type="medline">18442951</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(08)00043-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Axelrod</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Schnitzler</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>Huiling</given-names>
            </name>
            <name name-style="western">
              <surname>Irish</surname>
              <given-names>William</given-names>
            </name>
            <name name-style="western">
              <surname>Tuttle-Newhall</surname>
              <given-names>Elizabeth</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>Su-Hsin</given-names>
            </name>
            <name name-style="western">
              <surname>Kasiske</surname>
              <given-names>Bertram L</given-names>
            </name>
            <name name-style="western">
              <surname>Alhamad</surname>
              <given-names>Tarek</given-names>
            </name>
            <name name-style="western">
              <surname>Lentine</surname>
              <given-names>Krista L</given-names>
            </name>
          </person-group>
          <article-title>An economic assessment of contemporary kidney transplant practice</article-title>
          <source>Am J Transplant</source>
          <year>2018</year>
          <month>05</month>
          <volume>18</volume>
          <issue>5</issue>
          <fpage>1168</fpage>
          <lpage>1176</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1111/ajt.14702"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/ajt.14702</pub-id>
          <pub-id pub-id-type="medline">29451350</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kanellis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mulley</surname>
              <given-names>William R</given-names>
            </name>
          </person-group>
          <article-title>Allocation of deceased donor kidneys: A review of international practices</article-title>
          <source>Nephrology (Carlton)</source>
          <year>2019</year>
          <month>06</month>
          <volume>24</volume>
          <issue>6</issue>
          <fpage>591</fpage>
          <lpage>598</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1111/nep.13548"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/nep.13548</pub-id>
          <pub-id pub-id-type="medline">30536674</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>George</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Seals</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Aban</surname>
              <given-names>Inmaculada</given-names>
            </name>
          </person-group>
          <article-title>Survival analysis and regression models</article-title>
          <source>J Nucl Cardiol</source>
          <year>2014</year>
          <month>08</month>
          <volume>21</volume>
          <issue>4</issue>
          <fpage>686</fpage>
          <lpage>94</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24810431"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s12350-014-9908-2</pub-id>
          <pub-id pub-id-type="medline">24810431</pub-id>
          <pub-id pub-id-type="pmcid">PMC4111957</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Serpen</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Selman</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Bayes net classifiers for prediction of renal graft status and survival period</article-title>
          <source>World Academy of Science, Engineering and Technology, Open Science Index 39, International Journal of Biomedical and Biological Engineering</source>
          <year>2010</year>
          <fpage>88</fpage>
          <lpage>94</lpage>
          <pub-id pub-id-type="doi">10.5281/zenodo.1334844</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mamoshina</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Vieira</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Putin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Zhavoronkov</surname>
              <given-names>Alex</given-names>
            </name>
          </person-group>
          <article-title>Applications of Deep Learning in Biomedicine</article-title>
          <source>Mol Pharm</source>
          <year>2016</year>
          <month>05</month>
          <day>02</day>
          <volume>13</volume>
          <issue>5</issue>
          <fpage>1445</fpage>
          <lpage>54</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1021/acs.molpharmaceut.5b00982"/>
          </comment>
          <pub-id pub-id-type="doi">10.1021/acs.molpharmaceut.5b00982</pub-id>
          <pub-id pub-id-type="medline">27007977</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sadati</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Zafar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Babu</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Representation Learning with Autoencoders for Electronic Health Records: A Comparative Study</article-title>
          <source>Computing Research Repository</source>
          <access-date>2020-11-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1908.09174">https://arxiv.org/abs/1908.09174</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dag</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Oztekin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yucel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bulur</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Megahed</surname>
              <given-names>Fm</given-names>
            </name>
          </person-group>
          <article-title>Predicting heart transplantation outcomes through data analytics</article-title>
          <source>Decision Support Systems</source>
          <year>2017</year>
          <month>02</month>
          <volume>94</volume>
          <fpage>42</fpage>
          <lpage>52</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.dss.2016.10.005"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.dss.2016.10.005</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yoon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zame</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Banerjee</surname>
              <given-names>Amitava</given-names>
            </name>
            <name name-style="western">
              <surname>Cadeiras</surname>
              <given-names>Martin</given-names>
            </name>
            <name name-style="western">
              <surname>Alaa</surname>
              <given-names>Ahmed M</given-names>
            </name>
            <name name-style="western">
              <surname>van der Schaar</surname>
              <given-names>Mihaela</given-names>
            </name>
          </person-group>
          <article-title>Personalized survival predictions via Trees of Predictors: An application to cardiac transplantation</article-title>
          <source>PLoS One</source>
          <year>2018</year>
          <volume>13</volume>
          <issue>3</issue>
          <fpage>e0194985</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0194985"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0194985</pub-id>
          <pub-id pub-id-type="medline">29590219</pub-id>
          <pub-id pub-id-type="pii">PONE-D-17-38797</pub-id>
          <pub-id pub-id-type="pmcid">PMC5874060</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Van Belle</surname>
              <given-names>Vanya</given-names>
            </name>
            <name name-style="western">
              <surname>Pelckmans</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Van Huffel</surname>
              <given-names>Sabine</given-names>
            </name>
            <name name-style="western">
              <surname>Suykens</surname>
              <given-names>Johan A K</given-names>
            </name>
          </person-group>
          <article-title>Support vector methods for survival analysis: a comparison between ranking and regression approaches</article-title>
          <source>Artif Intell Med</source>
          <year>2011</year>
          <month>10</month>
          <volume>53</volume>
          <issue>2</issue>
          <fpage>107</fpage>
          <lpage>18</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.artmed.2011.06.006"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2011.06.006</pub-id>
          <pub-id pub-id-type="medline">21821401</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(11)00076-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dorado-Moreno</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pérez-Ortiz</surname>
              <given-names>María</given-names>
            </name>
            <name name-style="western">
              <surname>Gutiérrez</surname>
              <given-names>Pedro A</given-names>
            </name>
            <name name-style="western">
              <surname>Ciria</surname>
              <given-names>Rubén</given-names>
            </name>
            <name name-style="western">
              <surname>Briceño</surname>
              <given-names>Javier</given-names>
            </name>
            <name name-style="western">
              <surname>Hervás-Martínez</surname>
              <given-names>César</given-names>
            </name>
          </person-group>
          <article-title>Dynamically weighted evolutionary ordinal neural network for solving an imbalanced liver transplantation problem</article-title>
          <source>Artif Intell Med</source>
          <year>2017</year>
          <month>03</month>
          <volume>77</volume>
          <fpage>1</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2017.02.004</pub-id>
          <pub-id pub-id-type="medline">28545607</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(16)30290-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Iribarne</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Worku</surname>
              <given-names>Berhane</given-names>
            </name>
            <name name-style="western">
              <surname>Takayama</surname>
              <given-names>Hiroo</given-names>
            </name>
            <name name-style="western">
              <surname>Gelijns</surname>
              <given-names>Annetine C</given-names>
            </name>
            <name name-style="western">
              <surname>Naka</surname>
              <given-names>Yoshifumi</given-names>
            </name>
            <name name-style="western">
              <surname>Jeevanandam</surname>
              <given-names>Val</given-names>
            </name>
            <name name-style="western">
              <surname>Russo</surname>
              <given-names>Mark J</given-names>
            </name>
          </person-group>
          <article-title>Who is the high-risk recipient? Predicting mortality after heart transplant using pretransplant donor and recipient risk factors</article-title>
          <source>Ann Thorac Surg</source>
          <year>2011</year>
          <month>08</month>
          <volume>92</volume>
          <issue>2</issue>
          <fpage>520</fpage>
          <lpage>7; discussion 527</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21683337"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.athoracsur.2011.02.086</pub-id>
          <pub-id pub-id-type="medline">21683337</pub-id>
          <pub-id pub-id-type="pii">S0003-4975(11)00541-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC4243707</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lofaro</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Maestripieri</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Greco</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Papalia</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mancuso</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Conforti</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bonofiglio</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Prediction of chronic allograft nephropathy using classification trees</article-title>
          <source>Transplant Proc</source>
          <year>2010</year>
          <month>05</month>
          <volume>42</volume>
          <issue>4</issue>
          <fpage>1130</fpage>
          <lpage>3</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.transproceed.2010.03.062"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.transproceed.2010.03.062</pub-id>
          <pub-id pub-id-type="medline">20534242</pub-id>
          <pub-id pub-id-type="pii">S0041-1345(10)00350-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Medved</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nugues</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Nilsson</surname>
              <given-names>Johan</given-names>
            </name>
          </person-group>
          <article-title>Predicting the outcome for patients in a heart transplantation queue using deep learning</article-title>
          <source>Annu Int Conf IEEE Eng Med Biol Soc</source>
          <year>2017</year>
          <month>07</month>
          <volume>2017</volume>
          <fpage>74</fpage>
          <lpage>77</lpage>
          <pub-id pub-id-type="doi">10.1109/EMBC.2017.8036766</pub-id>
          <pub-id pub-id-type="medline">29059814</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chawla</surname>
              <given-names>NV</given-names>
            </name>
            <name name-style="western">
              <surname>Bowyer</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>LO</given-names>
            </name>
            <name name-style="western">
              <surname>Kegelmeyer</surname>
              <given-names>WP</given-names>
            </name>
          </person-group>
          <article-title>SMOTE: Synthetic Minority Over-sampling Technique</article-title>
          <source>jair</source>
          <year>2002</year>
          <month>06</month>
          <day>01</day>
          <volume>16</volume>
          <fpage>321</fpage>
          <lpage>357</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1613/jair.953"/>
          </comment>
          <pub-id pub-id-type="doi">10.1613/jair.953</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Buitinck</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Louppe</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Grisel</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Pedregosa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Mueller</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Scikit-learn</article-title>
          <source>GetMobile: Mobile Comp. and Comm</source>
          <year>2015</year>
          <month>06</month>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>29</fpage>
          <lpage>33</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1145/2786984.2786995"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2786984.2786995</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chollet</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <source>Keras</source>
          <access-date>2020-09-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/fchollet/keras">https://github.com/fchollet/keras</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Medved</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nugues</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Nilsson</surname>
              <given-names>Johan</given-names>
            </name>
          </person-group>
          <article-title>Selection of an optimal feature set to predict heart transplantation outcomes</article-title>
          <source>Annu Int Conf IEEE Eng Med Biol Soc</source>
          <year>2016</year>
          <month>08</month>
          <volume>2016</volume>
          <fpage>3290</fpage>
          <lpage>3293</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1109/EMBC.2016.7591431"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/EMBC.2016.7591431</pub-id>
          <pub-id pub-id-type="medline">28269008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thongkam</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>AdaBoost algorithm with random forests for predicting breast cancer survivability</article-title>
          <year>2008</year>
          <conf-name>IEEE International Joint Conference on Neural Networks</conf-name>
          <conf-date>1-8 June 2008</conf-date>
          <conf-loc>Hong Kong, China</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1109/IJCNN.2008.4634231"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/IJCNN.2008.4634231</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tennankore</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Alwayn</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Kiberd</surname>
              <given-names>Bryce A</given-names>
            </name>
          </person-group>
          <article-title>Prolonged warm ischemia time is associated with graft failure and mortality after kidney transplantation</article-title>
          <source>Kidney Int</source>
          <year>2016</year>
          <month>03</month>
          <volume>89</volume>
          <issue>3</issue>
          <fpage>648</fpage>
          <lpage>58</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0085-2538(15)00064-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.kint.2015.09.002</pub-id>
          <pub-id pub-id-type="medline">26880458</pub-id>
          <pub-id pub-id-type="pii">S0085-2538(15)00064-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Piros</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ferenci</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fleiner</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Andréka</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Fujita</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Főző</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kovács</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jánosi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Comparing machine learning and regression models for mortality prediction based on the Hungarian Myocardial Infarction Registry</article-title>
          <source>Knowledge-Based Systems</source>
          <year>2019</year>
          <month>09</month>
          <volume>179</volume>
          <fpage>1</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.knosys.2019.04.027"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.knosys.2019.04.027</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adegoke</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Banissi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Barikzai</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Prediction of breast cancer survivability using ensemble algorithms</article-title>
          <year>2017</year>
          <month>10</month>
          <day>18</day>
          <conf-name>International Conference on Smart Systems and Technologies (SST)</conf-name>
          <conf-date>2017</conf-date>
          <conf-loc>Osijek, Croatia</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1109/SST.2017.8188699"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/SST.2017.8188699</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yoo</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Noh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Hajeong</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Dong Ki</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>Chun Soo</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Young Hoon</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Jung Pyo</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Gunhee</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Yon Su</given-names>
            </name>
          </person-group>
          <article-title>A Machine Learning Approach Using Survival Statistics to Predict Graft Survival in Kidney Transplant Recipients: A Multicenter Cohort Study</article-title>
          <source>Sci Rep</source>
          <year>2017</year>
          <month>08</month>
          <day>21</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>8904</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-017-08008-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-017-08008-8</pub-id>
          <pub-id pub-id-type="medline">28827646</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-017-08008-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC5567098</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tiong</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Goldfarb</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kattan</surname>
              <given-names>M W</given-names>
            </name>
            <name name-style="western">
              <surname>Alster</surname>
              <given-names>J M</given-names>
            </name>
            <name name-style="western">
              <surname>Thuita</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wee</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Poggio</surname>
              <given-names>E D</given-names>
            </name>
          </person-group>
          <article-title>Nomograms for predicting graft function and survival in living donor kidney transplantation based on the UNOS Registry</article-title>
          <source>J Urol</source>
          <year>2009</year>
          <month>03</month>
          <volume>181</volume>
          <issue>3</issue>
          <fpage>1248</fpage>
          <lpage>55</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.juro.2008.10.164"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.juro.2008.10.164</pub-id>
          <pub-id pub-id-type="medline">19167732</pub-id>
          <pub-id pub-id-type="pii">S0022-5347(08)03012-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luck</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sylvain</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Cardinal</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Deep Learning for Patient-Specific Kidney Graft Survival Analysis</article-title>
          <source>ArXiv</source>
          <year>2017</year>
          <access-date>2020-10-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1705.10245">https://arxiv.org/abs/1705.10245</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Loupy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Aubert</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Orandi</surname>
              <given-names>Babak J</given-names>
            </name>
            <name name-style="western">
              <surname>Naesens</surname>
              <given-names>Maarten</given-names>
            </name>
            <name name-style="western">
              <surname>Bouatou</surname>
              <given-names>Yassine</given-names>
            </name>
            <name name-style="western">
              <surname>Raynaud</surname>
              <given-names>Marc</given-names>
            </name>
            <name name-style="western">
              <surname>Divard</surname>
              <given-names>Gillian</given-names>
            </name>
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>Annette M</given-names>
            </name>
            <name name-style="western">
              <surname>Viglietti</surname>
              <given-names>Denis</given-names>
            </name>
            <name name-style="western">
              <surname>Giral</surname>
              <given-names>Magali</given-names>
            </name>
            <name name-style="western">
              <surname>Kamar</surname>
              <given-names>Nassim</given-names>
            </name>
            <name name-style="western">
              <surname>Thaunat</surname>
              <given-names>Olivier</given-names>
            </name>
            <name name-style="western">
              <surname>Morelon</surname>
              <given-names>Emmanuel</given-names>
            </name>
            <name name-style="western">
              <surname>Delahousse</surname>
              <given-names>Michel</given-names>
            </name>
            <name name-style="western">
              <surname>Kuypers</surname>
              <given-names>Dirk</given-names>
            </name>
            <name name-style="western">
              <surname>Hertig</surname>
              <given-names>Alexandre</given-names>
            </name>
            <name name-style="western">
              <surname>Rondeau</surname>
              <given-names>Eric</given-names>
            </name>
            <name name-style="western">
              <surname>Bailly</surname>
              <given-names>Elodie</given-names>
            </name>
            <name name-style="western">
              <surname>Eskandary</surname>
              <given-names>Farsad</given-names>
            </name>
            <name name-style="western">
              <surname>Böhmig</surname>
              <given-names>Georg</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>Gaurav</given-names>
            </name>
            <name name-style="western">
              <surname>Glotz</surname>
              <given-names>Denis</given-names>
            </name>
            <name name-style="western">
              <surname>Legendre</surname>
              <given-names>Christophe</given-names>
            </name>
            <name name-style="western">
              <surname>Montgomery</surname>
              <given-names>Robert A</given-names>
            </name>
            <name name-style="western">
              <surname>Stegall</surname>
              <given-names>Mark D</given-names>
            </name>
            <name name-style="western">
              <surname>Empana</surname>
              <given-names>Jean-Philippe</given-names>
            </name>
            <name name-style="western">
              <surname>Jouven</surname>
              <given-names>Xavier</given-names>
            </name>
            <name name-style="western">
              <surname>Segev</surname>
              <given-names>Dorry L</given-names>
            </name>
            <name name-style="western">
              <surname>Lefaucheur</surname>
              <given-names>Carmen</given-names>
            </name>
          </person-group>
          <article-title>Prediction system for risk of allograft loss in patients receiving kidney transplants: international derivation and validation study</article-title>
          <source>BMJ</source>
          <year>2019</year>
          <month>09</month>
          <day>17</day>
          <volume>366</volume>
          <fpage>l4923</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/lookup/pmidlookup?view=long&#38;pmid=31530561"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.l4923</pub-id>
          <pub-id pub-id-type="medline">31530561</pub-id>
          <pub-id pub-id-type="pmcid">PMC6746192</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
