<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1d3 20150301//EN" "http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd">
<article article-type="research-article" dtd-version="1.1d3" xml:lang="en" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PLoS ONE</journal-id>
<journal-id journal-id-type="publisher-id">plos</journal-id>
<journal-id journal-id-type="pmc">plosone</journal-id>
<journal-title-group>
<journal-title>PLOS ONE</journal-title>
</journal-title-group>
<issn pub-type="epub">1932-6203</issn>
<publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, CA USA</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.1371/journal.pone.0209068</article-id>
<article-id pub-id-type="publisher-id">PONE-D-18-03292</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Research Article</subject>
</subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Surgical and invasive medical procedures</subject><subj-group><subject>Transplantation</subject><subj-group><subject>Organ transplantation</subject><subj-group><subject>Renal transplantation</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Surgical and invasive medical procedures</subject><subj-group><subject>Urinary system procedures</subject><subj-group><subject>Renal transplantation</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Research and analysis methods</subject><subj-group><subject>Mathematical and statistical techniques</subject><subj-group><subject>Statistical methods</subject><subj-group><subject>Forecasting</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Physical sciences</subject><subj-group><subject>Mathematics</subject><subj-group><subject>Statistics</subject><subj-group><subject>Statistical methods</subject><subj-group><subject>Forecasting</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Anatomy</subject><subj-group><subject>Renal system</subject><subj-group><subject>Kidneys</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Anatomy</subject><subj-group><subject>Renal system</subject><subj-group><subject>Kidneys</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Surgical and invasive medical procedures</subject><subj-group><subject>Transplantation</subject><subj-group><subject>Graft survival</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Ecology</subject><subj-group><subject>Ecosystems</subject><subj-group><subject>Forests</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Ecology and environmental sciences</subject><subj-group><subject>Ecology</subject><subj-group><subject>Ecosystems</subject><subj-group><subject>Forests</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Ecology and environmental sciences</subject><subj-group><subject>Terrestrial environments</subject><subj-group><subject>Forests</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Physical sciences</subject><subj-group><subject>Mathematics</subject><subj-group><subject>Discrete mathematics</subject><subj-group><subject>Combinatorics</subject><subj-group><subject>Permutation</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Engineering and technology</subject><subj-group><subject>Management engineering</subject><subj-group><subject>Decision analysis</subject><subj-group><subject>Decision trees</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Research and analysis methods</subject><subj-group><subject>Decision analysis</subject><subj-group><subject>Decision trees</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Organisms</subject><subj-group><subject>Eukaryota</subject><subj-group><subject>Plants</subject><subj-group><subject>Trees</subject></subj-group></subj-group></subj-group></subj-group></subj-group></article-categories>
<title-group>
<article-title>Using machine learning and an ensemble of methods to predict kidney transplant survival</article-title>
<alt-title alt-title-type="running-head">Using machine learning and an ensemble of methods to predict kidney transplant survival</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-6404-9140</contrib-id>
<name name-style="western">
<surname>Mark</surname>
<given-names>Ethan</given-names>
</name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Data curation</role>
<role content-type="http://credit.casrai.org/">Formal analysis</role>
<role content-type="http://credit.casrai.org/">Investigation</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Validation</role>
<role content-type="http://credit.casrai.org/">Visualization</role>
<role content-type="http://credit.casrai.org/">Writing – original draft</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="corresp" rid="cor001">*</xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Goldsman</surname>
<given-names>David</given-names>
</name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Project administration</role>
<role content-type="http://credit.casrai.org/">Resources</role>
<role content-type="http://credit.casrai.org/">Supervision</role>
<role content-type="http://credit.casrai.org/">Validation</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Gurbaxani</surname>
<given-names>Brian</given-names>
</name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Funding acquisition</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Project administration</role>
<role content-type="http://credit.casrai.org/">Resources</role>
<role content-type="http://credit.casrai.org/">Supervision</role>
<role content-type="http://credit.casrai.org/">Validation</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0003-2686-546X</contrib-id>
<name name-style="western">
<surname>Keskinocak</surname>
<given-names>Pinar</given-names>
</name>
<role content-type="http://credit.casrai.org/">Funding acquisition</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Project administration</role>
<role content-type="http://credit.casrai.org/">Resources</role>
<role content-type="http://credit.casrai.org/">Supervision</role>
<role content-type="http://credit.casrai.org/">Validation</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Sokol</surname>
<given-names>Joel</given-names>
</name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Funding acquisition</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Project administration</role>
<role content-type="http://credit.casrai.org/">Resources</role>
<role content-type="http://credit.casrai.org/">Supervision</role>
<role content-type="http://credit.casrai.org/">Validation</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
</contrib-group>
<aff id="aff001"><label>1</label> <addr-line>H. Milton Stewart School of Industrial and Systems Engineering, Georgia Institute of Technology, Atlanta, Georgia, United States of America</addr-line></aff>
<aff id="aff002"><label>2</label> <addr-line>Centers for Disease Control and Prevention, Atlanta, Georgia, United States of America</addr-line></aff>
<contrib-group>
<contrib contrib-type="editor" xlink:type="simple">
<name name-style="western">
<surname>Hatt</surname>
<given-names>Mathieu</given-names>
</name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/>
</contrib>
</contrib-group>
<aff id="edit1"><addr-line>INSERM, FRANCE</addr-line></aff>
<author-notes>
<fn fn-type="conflict" id="coi001">
<p>The authors have declared that no competing interests exist.</p>
</fn>
<corresp id="cor001">* E-mail: <email xlink:type="simple">emark3@gatech.edu</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>9</day>
<month>1</month>
<year>2019</year>
</pub-date>
<pub-date pub-type="collection">
<year>2019</year>
</pub-date>
<volume>14</volume>
<issue>1</issue>
<elocation-id>e0209068</elocation-id>
<history>
<date date-type="received">
<day>11</day>
<month>2</month>
<year>2018</year>
</date>
<date date-type="accepted">
<day>29</day>
<month>11</month>
<year>2018</year>
</date>
</history>
<permissions>
<license xlink:href="https://creativecommons.org/publicdomain/zero/1.0/" xlink:type="simple">
<license-p>This is an open access article, free of all copyright, and may be freely reproduced, distributed, transmitted, modified, built upon, or otherwise used by anyone for any lawful purpose. The work is made available under the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/publicdomain/zero/1.0/" xlink:type="simple">Creative Commons CC0</ext-link> public domain dedication.</license-p>
</license>
</permissions>
<self-uri content-type="pdf" xlink:href="info:doi/10.1371/journal.pone.0209068"/>
<abstract>
<p>We used an ensemble of statistical methods to build a model that predicts kidney transplant survival and identifies important predictive variables. The proposed model achieved better performance, measured by Harrell’s concordance index, than the Estimated Post Transplant Survival model used in the kidney allocation system in the U.S., and other models published recently in the literature. The model has a five-year concordance index of 0.724 (in comparison, the concordance index is 0.697 for the Estimated Post Transplant Survival model, the state of the art currently in use). It combines predictions from random survival forests with a Cox proportional hazards model. The rankings of importance for the model’s variables differ by transplant recipient age. Better survival predictions could eventually lead to more efficient allocation of kidneys and improve patient outcomes.</p>
</abstract>
<funding-group>
<award-group id="award001">
<funding-source>
<institution>This research has been supported in part by the Carlos and Marguerite Mason Trust Foundation, the Arnold Foundation, and by the following Georgia Tech benefactors: William W. George, Andrea Laliberte, Claudia L. and J. Paul Raines, and Richard E. “Rick” and Charlene Zalesky.</institution>
</funding-source>
<principal-award-recipient>
<name name-style="western">
<surname>Sokol</surname>
<given-names>Joel</given-names>
</name>
</principal-award-recipient>
</award-group>
<award-group id="award002">
<funding-source>
<institution>This research has been supported in part by the Carlos and Marguerite Mason Trust Foundation, the Arnold Foundation, and by the following Georgia Tech benefactors: William W. George, Andrea Laliberte, Claudia L. and J. Paul Raines, and Richard E. “Rick” and Charlene Zalesky.</institution>
</funding-source>
<principal-award-recipient>
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-6404-9140</contrib-id>
<name name-style="western">
<surname>Mark</surname>
<given-names>Ethan</given-names>
</name>
</principal-award-recipient>
</award-group>
<award-group id="award003">
<funding-source>
<institution>This research has been supported in part by the Carlos and Marguerite Mason Trust Foundation, the Arnold Foundation, and by the following Georgia Tech benefactors: William W. George, Andrea Laliberte, Claudia L. and J. Paul Raines, and Richard E. “Rick” and Charlene Zalesky.</institution>
</funding-source>
<principal-award-recipient>
<name name-style="western">
<surname>Goldsman</surname>
<given-names>David</given-names>
</name>
</principal-award-recipient>
</award-group>
<award-group id="award004">
<funding-source>
<institution>This research has been supported in part by the Carlos and Marguerite Mason Trust Foundation, the Arnold Foundation, and by the following Georgia Tech benefactors: William W. George, Andrea Laliberte, Claudia L. and J. Paul Raines, and Richard E. “Rick” and Charlene Zalesky.</institution>
</funding-source>
<principal-award-recipient>
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0003-2686-546X</contrib-id>
<name name-style="western">
<surname>Keskinocak</surname>
<given-names>Pinar</given-names>
</name>
</principal-award-recipient>
</award-group>
<award-group id="award005">
<funding-source>
<institution>This research has been supported in part by the Carlos and Marguerite Mason Trust Foundation, the Arnold Foundation, and by the following Georgia Tech benefactors: William W. George, Andrea Laliberte, Claudia L. and J. Paul Raines, and Richard E. “Rick” and Charlene Zalesky.</institution>
</funding-source>
<principal-award-recipient>
<name name-style="western">
<surname>Gurbaxani</surname>
<given-names>Brian</given-names>
</name>
</principal-award-recipient>
</award-group>
<funding-statement>This research has been supported in part by the Carlos and Marguerite Mason Trust, the Arnold Foundation, and by the following Georgia Tech benefactors: William W. George, Andrea Laliberte, Claudia L. and J. Paul Raines, and Richard E. “Rick” and Charlene Zalesky. Any opinions, findings, conclusions, or recommendations are those of the authors and do not necessarily reflect the views of the funding organizations or the CDC.</funding-statement>
</funding-group>
<counts>
<fig-count count="6"/>
<table-count count="2"/>
<page-count count="13"/>
</counts>
<custom-meta-group>
<custom-meta id="data-availability">
<meta-name>Data Availability</meta-name>
<meta-value>Data are available from the United Network for Organ Sharing (UNOS). A STAR (Standard Transplant Analysis and Research) file DVD was requested and obtained from OPTN/UNOS, and can be gotten via an application form from their website: <ext-link ext-link-type="uri" xlink:href="https://optn.transplant.hrsa.gov/data/request-data/" xlink:type="simple">https://optn.transplant.hrsa.gov/data/request-data/</ext-link>. The data is third party and was not collected either by the CDC or Georgia Institute of Technology. Neither the authors, CDC nor Georgia Institute of Technology required special privileges in order to acquire the data. More information on the UNOS data and instructions for researchers to request this data can be found at <ext-link ext-link-type="uri" xlink:href="https://unos.org/data/" xlink:type="simple">https://unos.org/data/</ext-link>. UNOS can also be contacted at (804) 782-4876.</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="sec001" sec-type="intro">
<title>Introduction</title>
<p>In 2013, the Organ Procurement and Transplantation Network (OPTN) adopted a new kidney allocation system using the Estimated Post Transplant Survival (EPTS) score [<xref ref-type="bibr" rid="pone.0209068.ref001">1</xref>, <xref ref-type="bibr" rid="pone.0209068.ref002">2</xref>]. Other kidney transplant survival models such as the Recipient Risk Score (RSS) [<xref ref-type="bibr" rid="pone.0209068.ref003">3</xref>] and Life Years from Transplant (LYFT) [<xref ref-type="bibr" rid="pone.0209068.ref004">4</xref>], have also been proposed by researchers. These techniques use a Cox proportional hazards model, which estimates the probability of a recipient’s post-transplant survival over a given time horizon [<xref ref-type="bibr" rid="pone.0209068.ref005">5</xref>]. The Cox proportional hazards model is the most widely used model for kidney transplant survival estimation [<xref ref-type="bibr" rid="pone.0209068.ref006">6</xref>]. Additional models include a Bayesian Belief Network (BBN) that was used to predict kidney graft failure [<xref ref-type="bibr" rid="pone.0209068.ref007">7</xref>].</p>
<p>We took a different approach, and used an ensemble of methods including random survival forests constructed from conditional inference trees. Our approach first clusters the data (e.g., into cohorts) and then chooses a model that achieves the best performance for each cluster. The advantage of combining different models to predict kidney transplant survival is that different models may work better than others on different cohorts of the data. We assessed the predictive accuracy of our proposed model using various metrics, including Harrell’s concordance index (C-index) [<xref ref-type="bibr" rid="pone.0209068.ref008">8</xref>], which is the percentage of patient pairs correctly “ranked” by the model based on their post-transplant survival duration in a given timeframe. The C-index for the proposed model is better than that of the EPTS model and other kidney transplant survival models proposed recently in the literature [<xref ref-type="bibr" rid="pone.0209068.ref002">2</xref>, <xref ref-type="bibr" rid="pone.0209068.ref004">4</xref>, <xref ref-type="bibr" rid="pone.0209068.ref006">6</xref>]. The results of the model applied to kidney transplant data are presented here, but the approach can be applied to other organs as well.</p>
</sec>
<sec id="sec002">
<title>Data</title>
<p>The dataset was provided by the United Network for Organ Sharing (UNOS) and consists of recipients who underwent kidney transplant surgery in the U.S. from 1987 to 2014 [<xref ref-type="bibr" rid="pone.0209068.ref009">9</xref>, <xref ref-type="bibr" rid="pone.0209068.ref010">10</xref>]. The data includes both living and deceased donors, pediatric and adult recipients, and censored observations. An observation is censored when it does not record a transplant recipient’s survival duration after surgery; in these censored observations, the date of the last follow-up is recorded. All data in this study were fully anonymized prior to access by any of the authors. More information on the UNOS data and instructions for researchers to request this data can be found at <ext-link ext-link-type="uri" xlink:href="https://unos.org/data/" xlink:type="simple">https://unos.org/data/</ext-link>.</p>
<sec id="sec003">
<title>Data preparation</title>
<p>In 2003, the UNOS board of directors instructed the Kidney Allocation Review Subcommittee to review the kidney allocation system [<xref ref-type="bibr" rid="pone.0209068.ref001">1</xref>]. Hence, we tested the following hypothesis: There is a statistically significant difference between the survival curves of recipients who underwent a kidney transplant before and after 2002. A log-rank test and visual inspection of the survival curves verified the significant difference (<xref ref-type="fig" rid="pone.0209068.g001">Fig 1</xref> and <xref ref-type="supplementary-material" rid="pone.0209068.s001">S1 Table</xref> found in the supporting information) [<xref ref-type="bibr" rid="pone.0209068.ref011">11</xref>]. Moreover, starting in 2012, a new allocation system was proposed that used the kidney donor risk index (KDRI) in addition to the EPTS model [<xref ref-type="bibr" rid="pone.0209068.ref012">12</xref>]. Therefore, in the analysis we used data that includes all kidney transplants performed between January 1, 2002 and December 31, 2011. Observations after 2012 would not have a 5-year post-transplant window at the time of this study. 5-year or longer time horizons for kidney transplant survival models have often been used in the literature [<xref ref-type="bibr" rid="pone.0209068.ref006">6</xref>, <xref ref-type="bibr" rid="pone.0209068.ref012">12</xref>, <xref ref-type="bibr" rid="pone.0209068.ref013">13</xref>].</p>
<fig id="pone.0209068.g001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0209068.g001</object-id>
<label>Fig 1</label>
<caption>
<title>Survival probabilities of different transplant cohorts.</title>
<p>The survival probabilities are calculated from the Kaplan-Meier estimate.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.g001" xlink:type="simple"/>
</fig>
<p>There were 163,199 observations available during the chosen ten-year time period with 487 variables. We removed variables not present in more than 95% of the observations unless they were identified as important in the previous literature [<xref ref-type="bibr" rid="pone.0209068.ref014">14</xref>–<xref ref-type="bibr" rid="pone.0209068.ref016">16</xref>]. In the latter case we removed variables not present in more than 80% of the observations. We also removed variables that were recorded twice, or were known only after the kidney transplant. The resulting data set had 73 variables.</p>
<p>The following approaches were used in addressing the issue of missing data: (i) imputation by predictive mean matching (PMM), and (ii) removing missing data for non-categorical variables. In approach (ii), we labeled missing data for categorical variables as ‘unknown’ and removed the non-categorical observations with missing data. Variable selection and all other analysis was carried out using approach (ii), unless specified otherwise. We cross-validated our proposed predictive model using both approaches. When cross-validating our final predictive model with approach (ii), 17% of the data were removed.</p>
<sec id="sec004">
<title>Grouping categorical variables</title>
<p>In the data, some of the categorical variables have a large number of possible values. For example, the variable kidney diagnosis, has 75 different possible values. To avoid overfitting and large model variance, we used the approach described in <xref ref-type="supplementary-material" rid="pone.0209068.s012">S1 Text</xref> and illustrated in <xref ref-type="supplementary-material" rid="pone.0209068.s002">S2 Table</xref> to group different values of the variable together. The values grouped together have a similar effect on the hazard function, controlling for relevant variables. Following this approach, we decreased the number of different kidney diagnosis values from 75 to 8.</p>
</sec>
</sec>
</sec>
<sec id="sec005" sec-type="materials|methods">
<title>Methods</title>
<sec id="sec006">
<title>Variable selection</title>
<p>For variable selection, we first used the Breiman-Cutler permutation importance measure for random survival forests to rank the variables in order of variable importance [<xref ref-type="bibr" rid="pone.0209068.ref017">17</xref>]. Harrell’s concordance index was used to measure the error rate for assessing the decrease in accuracy when permuting each predictor variable in the permutation importance calculation.</p>
<p>Recipient age was ranked as the most important variable by permutation importance on the entire dataset. Hence, we decided to split the data into age-based cohorts and produced two separate rankings of variables, one ranking for older recipients and one for younger recipients. This allowed us to build two predictive models for the different cohorts. To find the split value for recipient age, we built 100 survival decision trees [<xref ref-type="bibr" rid="pone.0209068.ref018">18</xref>, <xref ref-type="bibr" rid="pone.0209068.ref019">19</xref>], each with one split using only recipient age. Each decision tree finds the recipient age that gives the best binary split of two groups based on parameters suggested by Strobl et al. [<xref ref-type="bibr" rid="pone.0209068.ref020">20</xref>]. The average split value for the 100 trees was 48.7 years. Hence, rounding up to 50, we performed variable selection separately for transplant recipients aged 50 and under (cohort 1), and recipients aged 51 and older (cohort 2). The average 5-year survival probabilities are 93% and 80% for cohorts 1 and 2, respectively, based on the Kaplan-Meier [<xref ref-type="bibr" rid="pone.0209068.ref021">21</xref>] estimate. Figs <xref ref-type="fig" rid="pone.0209068.g002">2</xref> and <xref ref-type="fig" rid="pone.0209068.g003">3</xref> depict the top ten variables for cohorts 1 and 2, respectively, based on random survival forests permutation importance.</p>
<fig id="pone.0209068.g002" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0209068.g002</object-id>
<label>Fig 2</label>
<caption>
<title>Variable importance for recipients ages 50 and under based on Breiman-Cutler permutation importance.</title>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.g002" xlink:type="simple"/>
</fig>
<fig id="pone.0209068.g003" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0209068.g003</object-id>
<label>Fig 3</label>
<caption>
<title>Variable importance for recipients ages 51 and older based on Breiman-Cutler permutation importance.</title>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.g003" xlink:type="simple"/>
</fig>
<p>We then used a Cox model regularized with the Lasso (L1) penalty to help determine how many of the top variables to select [<xref ref-type="bibr" rid="pone.0209068.ref022">22</xref>]. We used 10-fold cross-validation to determine the optimal Lasso penalty. <xref ref-type="fig" rid="pone.0209068.g004">Fig 4</xref> shows the number of nonzero coefficients for different penalty values for cohort 1. The top row represents the number of non-zero coefficients per different values of the Lasso penalty. The vertical line L0 corresponds to the optimal penalty, which minimizes the Partial Likelihood Deviance (PLD). The line Lσ corresponds to the largest penalty value corresponding to the PLD values within one standard deviation of the minimum PLD. <xref ref-type="supplementary-material" rid="pone.0209068.s014">S1 Fig</xref> gives the analogous results for cohort 2. To keep the predictive model simple and minimize the number of variables, we used the Lσ penalty, which has fewer nonzero coefficients than using L0.</p>
<fig id="pone.0209068.g004" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0209068.g004</object-id>
<label>Fig 4</label>
<caption>
<title>Cox lasso variable selection for recipients ages 50 and under.</title>
<p>The top row represents the number of non-zero coefficients per Lasso penalty value, lambda. The vertical line L0 corresponds to the optimal penalty, which minimizes the PLD. The line Lσ corresponds to the largest penalty value corresponding to the PLD values within one standard deviation of the minimum PLD.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.g004" xlink:type="simple"/>
</fig>
<p>For each cohort, variables that have nonzero coefficients in the Lasso model and which are also among the top 20 variables chosen by permutation importance are included in the predictive model. <xref ref-type="table" rid="pone.0209068.t001">Table 1</xref> lists the final selections of variables for each cohort. <xref ref-type="supplementary-material" rid="pone.0209068.s003">S3 Table</xref> provides a description of the variables we used in our proposed predictive survival model. <xref ref-type="supplementary-material" rid="pone.0209068.s004">S4 Table</xref> gives the mean values from the data for numeric variables and the percentages of observations for each category for categorical variables.</p>
<table-wrap id="pone.0209068.t001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0209068.t001</object-id>
<label>Table 1</label> <caption><title>Variables in the proposed predictive model.</title></caption>
<alternatives>
<graphic id="pone.0209068.t001g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.t001" xlink:type="simple"/>
<table>
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="center">Cohort 1: Ages 50 and Under</th>
<th align="center">Cohort 2: Ages 51 and Older</th>
</tr>
</thead>
<tbody>
<tr>
<td align="center">AGE</td>
<td align="center">AGE</td>
</tr>
<tr>
<td align="center">COLD_ISCH_KI</td>
<td align="center">AGE_DON</td>
</tr>
<tr>
<td align="center">CREAT_TRR</td>
<td align="center">ANY_DIAL</td>
</tr>
<tr>
<td align="center">DEATH_MECH_DON</td>
<td align="center">COD_CAD_DON</td>
</tr>
<tr>
<td align="center">DIAB</td>
<td align="center">COLD_ISCH_KI</td>
</tr>
<tr>
<td align="center">DIAG_KI</td>
<td align="center">CREAT_TRR</td>
</tr>
<tr>
<td align="center">ETHCAT</td>
<td align="center">DEATH_MECH_DON</td>
</tr>
<tr>
<td align="center">FUNC_STAT_TRR</td>
<td align="center">DIAB</td>
</tr>
<tr>
<td align="center">HCV_SEROSTATUS</td>
<td align="center">DIAG_KI</td>
</tr>
<tr>
<td align="center">HIST_DIABETES_DON</td>
<td align="center">DRUGTRT_COPD</td>
</tr>
<tr>
<td align="center">HIST_HYPERTENS_DON</td>
<td align="center">ETHCAT</td>
</tr>
<tr>
<td align="center">MED_COND_TRR</td>
<td align="center">FUNC_STAT_TRR</td>
</tr>
<tr>
<td align="center">PAYMENTSOURCE_AT_TRANSPLANT</td>
<td align="center">HCV_SEROSTATUS</td>
</tr>
<tr>
<td align="center">REGION</td>
<td align="center">HIST_HYPERTENS_DON</td>
</tr>
</tbody>
</table>
</alternatives>
<table-wrap-foot>
<fn id="t001fn001"><p>A description of each variable is given in <xref ref-type="supplementary-material" rid="pone.0209068.s003">S3 Table</xref>.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="sec007">
<title>Predictive models</title>
<p>For cohort 1, we built a random survival forest model with conditional inference trees as base learners [<xref ref-type="bibr" rid="pone.0209068.ref018">18</xref>, <xref ref-type="bibr" rid="pone.0209068.ref019">19</xref>]. We grew a forest with 800 trees and four randomly selected variables considered for each split. Random forest parameters suggested by Strobl et al. [<xref ref-type="bibr" rid="pone.0209068.ref020">20</xref>] were used with a slight modification. We restricted a tree split to occur only if the splitting test statistic exceeded 0.3, instead of guaranteeing the inclusion of all splits. In testing, we found that this allowed the use of smaller trees with the same predictive performance measured by Harrell’s concordance index.</p>
<p>For cohort 2, the Cox proportional hazards model achieved a better concordance index than using random survival forests (0.664 vs. 0.655 based on 10 cross-validation samples of 80% training data and 20% out-of-sample data). Hence for cohort 2, we fit a Cox proportional hazards model. <xref ref-type="supplementary-material" rid="pone.0209068.s005">S5 Table</xref> shows the coefficients for the Cox model when it was trained on 100,000 observations.</p>
<p>In the proposed predictive model, we use the combination of random survival forests for cohort 1, and the Cox model for cohort 2. We evaluated the performance of the proposed model compared to other models by two metrics using cross-validation: (i) Harrell’s concordance index, and (ii) the integrated Brier score [<xref ref-type="bibr" rid="pone.0209068.ref023">23</xref>]. In addition to comparing the performance of our model to the reported performance of the EPTS model [<xref ref-type="bibr" rid="pone.0209068.ref002">2</xref>], we evaluated the EPTS model on the same data that we used for our model. We used PMM for missing data because the EPTS model does not allow for variable inputs to be unknown. We validated our proposed model in multiple ways, using PMM imputation and without imputation.</p>
<p>Our methodology for building the proposed predictive model is described by the following high-level summary:</p>
<list list-type="order">
<list-item><p>Identify important predictive variables by performing variable selection techniques such as Lasso or permutation importance.</p></list-item>
<list-item><p>Test the performance of multiple predictive models on the data using the variables identified in step 1. Use cross-validation and metrics such as the concordance index to evaluate the performance.</p></list-item>
<list-item><p>Determine the best binary split in the data using methods such as decision trees.</p></list-item>
<list-item><p>Repeat steps 1–3 for both subsets of the data a specified number of times. The final model consists of combining the predictions from the models that perform best on the different subsets of the data.</p></list-item>
</list>
</sec>
</sec>
<sec id="sec008" sec-type="results">
<title>Results</title>
<p><xref ref-type="table" rid="pone.0209068.t002">Table 2</xref> shows the 5-year Harrell’s concordance index and the integrated Brier score for the prosed model using 10 random samples of 80,000 training observations and 20,000 out-of-sample observations. It also reports the performance of a number of other models from the recent literature. Harrell’s 5-year concordance index for our proposed model is 0.724 versus 0.69 reported for the EPTS model [<xref ref-type="bibr" rid="pone.0209068.ref002">2</xref>] and 0.697 for the EPTS model applied to the data used for this study. The concordance index of the proposed model is 0.717 when we remove the donor variables and include only the recipient variables. This provides a more direct comparison to the EPTS model since the EPTS model does not use donor variables. The performance of the proposed model was nearly the same when we also validated it using PMM imputation as opposed to validation without imputation.</p>
<table-wrap id="pone.0209068.t002" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0209068.t002</object-id>
<label>Table 2</label> <caption><title>Performance of the proposed predictive model compared to other models.</title></caption>
<alternatives>
<graphic id="pone.0209068.t002g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.t002" xlink:type="simple"/>
<table>
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="center">Model</th>
<th align="center">5-Year C-index</th>
<th align="center">5-Year Integrated Brier Score</th>
</tr>
</thead>
<tbody>
<tr>
<td align="center">LYFT Reported [<xref ref-type="bibr" rid="pone.0209068.ref004">4</xref>]</td>
<td align="center">0.680</td>
<td align="center">Not Reported</td>
</tr>
<tr>
<td align="center">EPTS Reported [<xref ref-type="bibr" rid="pone.0209068.ref002">2</xref>]</td>
<td align="center">0.69</td>
<td align="center">Not Reported</td>
</tr>
<tr>
<td align="center">EPTS Using the Same Cross-Validation Data as the Proposed Model</td>
<td align="center">0.697</td>
<td align="center">Not Calculated</td>
</tr>
<tr>
<td align="center">Li et al. [<xref ref-type="bibr" rid="pone.0209068.ref006">6</xref>] Reported</td>
<td align="center">0.700</td>
<td align="center">Not Reported</td>
</tr>
<tr>
<td align="center">Cox Model for Both Cohorts<xref ref-type="table-fn" rid="t002fn002">*</xref></td>
<td align="center">0.706</td>
<td align="center">0.063</td>
</tr>
<tr>
<td align="center">Random Forests for Both Cohorts<xref ref-type="table-fn" rid="t002fn002">*</xref></td>
<td align="center">0.718</td>
<td align="center">0.062</td>
</tr>
<tr>
<td align="center">Proposed Model without Donor Variables<xref ref-type="table-fn" rid="t002fn003">**</xref></td>
<td align="center">0.717</td>
<td align="center">0.060</td>
</tr>
<tr>
<td align="center">Proposed Model</td>
<td align="center">0.724</td>
<td align="center">0.061</td>
</tr>
<tr>
<td align="center">Proposed Model using PMM Imputation</td>
<td align="center">0.724</td>
<td align="center">0.060</td>
</tr>
</tbody>
</table>
</alternatives>
<table-wrap-foot>
<fn id="t002fn001"><p>Performance from 10 random samples of 80,000 training observations and 20,000 out-of-sample observations for all models except those marked ‘Reported’, where the metrics shown were provided in the literature for their respective models.</p></fn>
<fn id="t002fn002"><p>*These two predictive models used the variable selection techniques we used for each cohort separately but instead applied to all the data.</p></fn>
<fn id="t002fn003"><p>**Donor variables that were removed were: AGE_DON, COD_CAD_DON, COLD_ISCH_KI, DEATH_MECH_DON, HIST_DIABETES_DON, and HIST_HYPERTENS_DON.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>Figs <xref ref-type="fig" rid="pone.0209068.g005">5</xref> and <xref ref-type="fig" rid="pone.0209068.g006">6</xref> illustrate the behavior of our proposed model trained using a random sample of 100,000 observations and validated on 25,000 out-of-sample observations. The solid lines represent the survival predictions and the dotted lines depict the observed Kaplan-Meier estimates for the out-of-sample observations. We also illustrate the model’s survival predictions for different values of its variables, holding the remaining variables constant, in <xref ref-type="supplementary-material" rid="pone.0209068.s015">S2 Fig</xref> (also see <xref ref-type="supplementary-material" rid="pone.0209068.s006">S6</xref> and <xref ref-type="supplementary-material" rid="pone.0209068.s007">S7</xref> Tables). <xref ref-type="supplementary-material" rid="pone.0209068.s008">S8</xref> and <xref ref-type="supplementary-material" rid="pone.0209068.s009">S9</xref> Tables present results on the performance of our proposed model at different numbers of days after transplantation and on different categories respectively. <xref ref-type="supplementary-material" rid="pone.0209068.s010">S10 Table</xref> gives results for additional tests on the performance of our proposed model and the EPTS model on data without pediatric recipients and living donors. <xref ref-type="supplementary-material" rid="pone.0209068.s011">S11 Table</xref> shows the performance of the proposed model compared to the EPTS model on the general population for each cross-validation sample.</p>
<fig id="pone.0209068.g005" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0209068.g005</object-id>
<label>Fig 5</label>
<caption>
<title>Predicted survival of the proposed model.</title>
<p>Trained on 100,000 observations and validated on 25,000 out-of-sample observations. The survival curves are separated into 5 groups based on the predicted 5-year survival in the out-of-sample data.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.g005" xlink:type="simple"/>
</fig>
<fig id="pone.0209068.g006" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0209068.g006</object-id>
<label>Fig 6</label>
<caption>
<title>Predicted survival of the proposed model for a ‘typical’ kidney transplant recipient.</title>
<p>Trained on 100,000 observations and validated on 25,000 out-of-sample observations. In the out-of-sample data, an observation is considered ‘typical’ if the values are within one standard deviation of the mean for recipient age, donor age, and cold ischemia time, and the most common values from the data for recipient diabetes, recipient dialysis status, recipient medical condition, and donor hypertension status.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.g006" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec009" sec-type="conclusions">
<title>Discussion</title>
<p>The current kidney allocation system, adopted in 2013, matches the best 20% of kidneys as determined by the KDRI, to the top 20% of potential recipients with the highest predicted transplant survival probabilities, estimated by the EPTS model [<xref ref-type="bibr" rid="pone.0209068.ref012">12</xref>]. Improving the predictive performance of kidney transplant survival models can help the kidney allocation system more accurately rank potential recipients based on estimates of post-transplant survival. <xref ref-type="table" rid="pone.0209068.t002">Table 2</xref> shows that our proposed model has a higher concordance index than the EPTS model and other models recently published in the literature, such as the LYFT model and the flexible parametric model proposed by Li et al. [<xref ref-type="bibr" rid="pone.0209068.ref006">6</xref>]. Hence, when considering a random pair of candidates and determining which candidate in the pair has a higher post-transplant survival probability (in a given time frame, e.g., 5 years), our model will result in more correct pair rankings than the EPTS model, and has the potential to significantly improve the matching of organs to recipients. We also found that by using a model that combines different predictive models and variables for different age groups, we achieved better performance than by using the same model and variables for both cohorts.</p>
<p>A comparison of kidney transplant survival models over time shows a concordance index of 0.68 in 2009 for the LYFT model (Wolfe et al., 2009), a concordance index of 0.69 in 2013 for the EPTS model currently used in the kidney allocation system (Clayton et al., 2014), and an index of 0.70 in 2016 from Li et al. (2016). A gain in the index of 0.01 can have a dramatic impact considering that these models are used in the U.S. kidney allocation system, which is responsible for allocating tens of thousands of kidneys per year. Our model yields an improvement in the concordance index of 0.03 over the EPTS model when tested on the same data, which can have a significant impact on ranking kidney waitlist patients by their post-transplant survival more accurately.</p>
<p>Unlike the EPTS model, the proposed model has the flexibility to take into account characteristics of donors; hence, it can help predict which donor-recipient matching can result in the highest post-transplant survival, among several choices. The proposed model can also be used without the donor variables, and still result in a better concordance index than the EPTS model. This can be useful in estimating the survival of transplant recipients before the donor information is known, such as when determining recipient priority in the allocation system.</p>
<p>Our findings suggest that there may be a benefit for building separate models for different cohorts of patients (in this case cohorts separated by recipient age). For example, the variable region, was in the top ten ranked variables for cohort 1 but not for cohort 2. Hence, the impact of region on post-transplant survival is higher for cohort 1 than cohort 2.</p>
<p>The proposed model uses machine learning methods, and although it does not result in a simple equation to predict transplant survival, such methods are straightforward to apply. Further, the proposed model uses 18 different predictive variables versus 4 used by EPTS. While the model complexity could be viewed as a limitation, with the increasing power of computer tools, the model can easily be implemented in practice.</p>
</sec>
<sec id="sec010">
<title>Supporting information</title>
<supplementary-material id="pone.0209068.s001" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s001" xlink:type="simple">
<label>S1 Table</label>
<caption>
<title>Log-Rank test for differences in cohort survival.</title>
<p>χ2 statistic value = 259.3, <italic>p</italic>-value = 0.</p>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0209068.s002" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s002" xlink:type="simple">
<label>S2 Table</label>
<caption>
<title>Original kidney diagnosis values and their new groupings.</title>
<p>We used the coefficients of a Cox model to group values with similar predicted transplant survival, controlling for other variables. We controlled for: recipient age, recipient diabetes, recipient cold ischemia time, recipient initial waitlist status, recipient ethnicity, donor age, donor cause of death, and donor living status. We considered putting the first three values of kidney diagnosis in S2 Table in its own group. However, they had fewer than 90 observations combined, which may cause overfitting issues.</p>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0209068.s003" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s003" xlink:type="simple">
<label>S3 Table</label>
<caption>
<title>Descriptions of variables used in the proposed model.</title>
<p>*See <xref ref-type="supplementary-material" rid="pone.0209068.s002">S2 Table</xref> for variable values in this group.</p>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0209068.s004" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s004" xlink:type="simple">
<label>S4 Table</label>
<caption>
<title>Summary of variables used in the predictive models.</title>
<p>The mean value of the data is given for numeric variables and the percentage of observations for each category is given for categorical variables. *See <xref ref-type="supplementary-material" rid="pone.0209068.s002">S2 Table</xref> for variable values in this group.</p>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0209068.s005" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s005" xlink:type="simple">
<label>S5 Table</label>
<caption>
<title>Cox proportional hazards model coefficients for the proposed model.</title>
<p>Trained on a Random Sample of 100,000 observations.</p>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0209068.s006" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s006" xlink:type="simple">
<label>S6 Table</label>
<caption>
<title>Variables held constant in <xref ref-type="supplementary-material" rid="pone.0209068.s015">S2 Fig</xref>.</title>
<p>*See <xref ref-type="supplementary-material" rid="pone.0209068.s002">S2 Table</xref> for variable values in this group.</p>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0209068.s007" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s007" xlink:type="simple">
<label>S7 Table</label>
<caption>
<title>Factor level legend for <xref ref-type="supplementary-material" rid="pone.0209068.s015">S2 Fig</xref>.</title>
<p>*See <xref ref-type="supplementary-material" rid="pone.0209068.s002">S2 Table</xref> for variable values in this group.</p>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0209068.s008" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s008" xlink:type="simple">
<label>S8 Table</label>
<caption>
<title>Concordance index at different days after transplant for the proposed model.</title>
<p>The performance is calculated from 10 random samples of 80,000 training observations and 20,000 out-of-sample observations.</p>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0209068.s009" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s009" xlink:type="simple">
<label>S9 Table</label>
<caption>
<title>Proposed model performance by category.</title>
<p>Performance from a random sample of 100,000 training observations and 25,000 out-of-sample observations.</p>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0209068.s010" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s010" xlink:type="simple">
<label>S10 Table</label>
<caption>
<title>Additional model testing.</title>
<p>10 random samples of 80,000 training observations and 20,000 out-of-sample observations. **Donor variables that were removed: AGE_DON, COD_CAD_DON, COLD_ISCH_KI, DEATH_MECH_DON, HIST_DIABETES_DON, and HIST_HYPERTENS_DON.</p>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0209068.s011" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s011" xlink:type="simple">
<label>S11 Table</label>
<caption>
<title>Proposed model and EPTS model cross-validation results in <xref ref-type="table" rid="pone.0209068.t002">Table 2</xref>.</title>
<p>C-index based on 10 random samples of 80,000 training observations and 20,000 out-of-sample observations. Using a paired two sample Student's t-test, we reject the null hypothesis that the difference in model performance means is equal to 0 (p-value = 2.4x10<sup>-11</sup>). We also used a Shapiro-Wilk normality test and an F test for equality of variances to verify the assumptions of the t-test (Shapiro-Wilk p-value of 0.654 and 0.298 for the proposed model data and EPTS model data respectively; hence we don’t reject the null hypothesis of normally distributed model performance results. F test p-value of 0.605; hence we don’t reject the null hypothesis of equality of model performance variance).</p>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0209068.s012" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s012" xlink:type="simple">
<label>S1 Text</label>
<caption>
<title>Grouping values for the variable kidney diagnosis.</title>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0209068.s013" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s013" xlink:type="simple">
<label>S2 Text</label>
<caption>
<title>Software.</title>
<p>The analysis was undertaken using the statistical software R version 3.3.2 as well as several key packages listed in the references [<xref ref-type="bibr" rid="pone.0209068.ref024">24</xref>–<xref ref-type="bibr" rid="pone.0209068.ref030">30</xref>].</p>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0209068.s014" mimetype="image/tiff" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s014" xlink:type="simple">
<label>S1 Fig</label>
<caption>
<title>Lasso variable selection for recipients ages 51 and older.</title>
<p>(TIF)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0209068.s015" mimetype="image/tiff" position="float" xlink:href="info:doi/10.1371/journal.pone.0209068.s015" xlink:type="simple">
<label>S2 Fig</label>
<caption>
<title>Proposed model’s 5-year survival predictions for different variable values.</title>
<p>In each plot, variable values not shown are held constant and listed in <xref ref-type="supplementary-material" rid="pone.0209068.s006">S6 Table</xref>. The model was trained on 100,000 random training observations.</p>
<p>(TIF)</p>
</caption>
</supplementary-material>
</sec>
</body>
<back>
<ack>
<p>We are grateful to the editors and referees for their constructive feedback and suggestions that helped improved this paper.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="pone.0209068.ref001"><label>1</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Clayton</surname> <given-names>PA</given-names></name>, <name name-style="western"><surname>McDonald</surname> <given-names>SP</given-names></name>, <name name-style="western"><surname>Snyder</surname> <given-names>JJ</given-names></name>, <name name-style="western"><surname>Salkowski</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Chadban</surname> <given-names>SJ</given-names></name>. <article-title>External validation of the estimated posttransplant survival score for allocation of deceased donor kidneys in the United States</article-title>. <source>Am J Transplant</source>. <year>2014</year>;<volume>14</volume>(<issue>8</issue>):<fpage>1922</fpage>–<lpage>6</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/ajt.12761" xlink:type="simple">10.1111/ajt.12761</ext-link></comment> <object-id pub-id-type="pmid">24903739</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref002"><label>2</label><mixed-citation publication-type="other" xlink:type="simple">A guide to calculating and interpreting the Estimated Post-Transplant Survival (EPTS) score used in the Kidney Allocation System (KAS). 2014. Available from: <ext-link ext-link-type="uri" xlink:href="https://optn.transplant.hrsa.gov/media/1511/guide_to_calculating_interpreting_epts.pdf" xlink:type="simple">https://optn.transplant.hrsa.gov/media/1511/guide_to_calculating_interpreting_epts.pdf</ext-link>.</mixed-citation></ref>
<ref id="pone.0209068.ref003"><label>3</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Baskin-Bey</surname> <given-names>ES</given-names></name>, <name name-style="western"><surname>Kremers</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Nyberg</surname> <given-names>SL</given-names></name>. <article-title>A recipient risk score for deceased donor renal allocation</article-title>. <source>Am J Kidney Dis</source>. <year>2007</year>;<volume>49</volume>(<issue>2</issue>):<fpage>284</fpage>–<lpage>93</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1053/j.ajkd.2006.10.018" xlink:type="simple">10.1053/j.ajkd.2006.10.018</ext-link></comment> <object-id pub-id-type="pmid">17261431</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref004"><label>4</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Wolfe</surname> <given-names>RA</given-names></name>, <name name-style="western"><surname>McCullough</surname> <given-names>KP</given-names></name>, <name name-style="western"><surname>Leichtman</surname> <given-names>AB</given-names></name>. <article-title>Predictability of survival models for waiting list and transplant patients: calculating LYFT</article-title>. <source>Am J Transplant</source>. <year>2009</year>;<volume>9</volume>(<issue>7</issue>):<fpage>1523</fpage>–<lpage>7</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.1600-6143.2009.02708.x" xlink:type="simple">10.1111/j.1600-6143.2009.02708.x</ext-link></comment> <object-id pub-id-type="pmid">19656143</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref005"><label>5</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Cox</surname> <given-names>DR</given-names></name>. <article-title>Regression models and life-tables</article-title>. <source>J R Stat Soc Series B Stat Methodol</source>. <year>1972</year>;<volume>34</volume>(<issue>2</issue>):<fpage>187</fpage>–<lpage>220</lpage>.</mixed-citation></ref>
<ref id="pone.0209068.ref006"><label>6</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Li</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Cairns</surname> <given-names>JA</given-names></name>, <name name-style="western"><surname>Robb</surname> <given-names>ML</given-names></name>, <name name-style="western"><surname>Johnson</surname> <given-names>RJ</given-names></name>, <name name-style="western"><surname>Watson</surname> <given-names>CJ</given-names></name>, <name name-style="western"><surname>Forsythe</surname> <given-names>JL</given-names></name>, <etal>et al</etal>. <article-title>Predicting patient survival after deceased donor kidney transplantation using flexible parametric modelling</article-title>. <source>BMC Nephrol</source>. <year>2016</year>;<volume>17</volume>:<fpage>51</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/s12882-016-0264-0" xlink:type="simple">10.1186/s12882-016-0264-0</ext-link></comment> <object-id pub-id-type="pmid">27225846</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref007"><label>7</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Brown</surname> <given-names>TS</given-names></name>, <name name-style="western"><surname>Elster</surname> <given-names>EA</given-names></name>, <name name-style="western"><surname>Stevens</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Graybill</surname> <given-names>JC</given-names></name>, <name name-style="western"><surname>Gillern</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Phinney</surname> <given-names>S</given-names></name>, <etal>et al</etal>. <article-title>Bayesian modeling of pretransplant variables accurately predicts kidney graft survival</article-title>. <source>Am J Nephrol</source>. <year>2012</year>;<volume>36</volume>(<issue>6</issue>):<fpage>561</fpage>–<lpage>9</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1159/000345552" xlink:type="simple">10.1159/000345552</ext-link></comment> <object-id pub-id-type="pmid">23221105</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref008"><label>8</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Harrell</surname> <given-names>FEJ</given-names></name>, <name name-style="western"><surname>Califf</surname> <given-names>RM</given-names></name>, <name name-style="western"><surname>Pryor</surname> <given-names>DB</given-names></name>, <name name-style="western"><surname>Lee</surname> <given-names>KL</given-names></name>, <name name-style="western"><surname>Rosati</surname> <given-names>RA</given-names></name>. <article-title>Evaluating the yield of medical tests</article-title>. <source>JAMA</source>. <year>1982</year>;<volume>247</volume>(<issue>18</issue>):<fpage>2543</fpage>–<lpage>6</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1001/jama.1982.03320430047030" xlink:type="simple">10.1001/jama.1982.03320430047030</ext-link></comment> <object-id pub-id-type="pmid">7069920</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref009"><label>9</label><mixed-citation publication-type="other" xlink:type="simple">Organ Procurement and Transplantation Network. Data—OPTN. 2016. Available from: <ext-link ext-link-type="uri" xlink:href="https://optn.transplant.hrsa.gov/data/" xlink:type="simple">https://optn.transplant.hrsa.gov/data/</ext-link>.</mixed-citation></ref>
<ref id="pone.0209068.ref010"><label>10</label><mixed-citation publication-type="other" xlink:type="simple">United Network for Organ Sharing. Data—UNOS. 2016. Available from: <ext-link ext-link-type="uri" xlink:href="https://unos.org/data/" xlink:type="simple">https://unos.org/data/</ext-link>.</mixed-citation></ref>
<ref id="pone.0209068.ref011"><label>11</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Peto</surname> <given-names>R</given-names></name>, J. P. <article-title>Asymptotically efficient rank invariant test procedures</article-title>. <source>J R Stat Soc Ser A</source>. <year>1972</year>;<volume>135</volume>(<issue>2</issue>):<fpage>185</fpage>–<lpage>207</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.2307/2344317" xlink:type="simple">10.2307/2344317</ext-link></comment></mixed-citation></ref>
<ref id="pone.0209068.ref012"><label>12</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Rao</surname> <given-names>PS</given-names></name>, <name name-style="western"><surname>Schaubel</surname> <given-names>DE</given-names></name>, <name name-style="western"><surname>Guidinger</surname> <given-names>MK</given-names></name>, <name name-style="western"><surname>Andreoni</surname> <given-names>KA</given-names></name>, <name name-style="western"><surname>Wolfe</surname> <given-names>RA</given-names></name>, <name name-style="western"><surname>Merion</surname> <given-names>RM</given-names></name>, <etal>et al</etal>. <article-title>A comprehensive risk quantification score for deceased donor kidneys: the kidney donor risk index</article-title>. <source>Transplantation</source>. <year>2009</year>;<volume>88</volume>(<issue>2</issue>):<fpage>231</fpage>–<lpage>6</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1097/TP.0b013e3181ac620b" xlink:type="simple">10.1097/TP.0b013e3181ac620b</ext-link></comment> <object-id pub-id-type="pmid">19623019</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref013"><label>13</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Krikov</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Khan</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Baird</surname> <given-names>BC</given-names></name>, <name name-style="western"><surname>Barenbaum</surname> <given-names>LL</given-names></name>, <name name-style="western"><surname>Leviatov</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Koford</surname> <given-names>JK</given-names></name>, <etal>et al</etal>. <article-title>Predicting kidney transplant survival using tree-based modeling</article-title>. <source>ASAIO J</source>. <year>2007</year>;<volume>53</volume>(<issue>5</issue>):<fpage>592</fpage>–<lpage>600</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1097/MAT.0b013e318145b9f7" xlink:type="simple">10.1097/MAT.0b013e318145b9f7</ext-link></comment> <object-id pub-id-type="pmid">17885333</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref014"><label>14</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Kasiske</surname> <given-names>BL</given-names></name>, <name name-style="western"><surname>Israni</surname> <given-names>AK</given-names></name>, <name name-style="western"><surname>Snyder</surname> <given-names>JJ</given-names></name>, <name name-style="western"><surname>Skeans</surname> <given-names>MA</given-names></name>, <name name-style="western"><surname>Peng</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>ED</surname> <given-names>W</given-names></name>. <article-title>A simple tool to predict outcomes after kidney transplant</article-title>. <source>Am J Kidney Dis</source>. <year>2010</year>;<volume>56</volume>(<issue>5</issue>):<fpage>947</fpage>–<lpage>60</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1053/j.ajkd.2010.06.020" xlink:type="simple">10.1053/j.ajkd.2010.06.020</ext-link></comment> <object-id pub-id-type="pmid">20801565</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref015"><label>15</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Chow</surname> <given-names>EKH</given-names></name>, <name name-style="western"><surname>Massie</surname> <given-names>AB</given-names></name>, <name name-style="western"><surname>Muzaale</surname> <given-names>AD</given-names></name>, <name name-style="western"><surname>Singer</surname> <given-names>AL</given-names></name>, <name name-style="western"><surname>Kucirka</surname> <given-names>LM</given-names></name>, <name name-style="western"><surname>Montgomery</surname> <given-names>RA</given-names></name>, <etal>et al</etal>. <article-title>Identifying appropriate recipients for CDC infectious risk donor kidneys</article-title>. <source>Am J Transplant</source>. <year>2013</year>;<volume>13</volume>(<issue>5</issue>):<fpage>1227</fpage>–<lpage>34</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/ajt.12206" xlink:type="simple">10.1111/ajt.12206</ext-link></comment> <object-id pub-id-type="pmid">23621162</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref016"><label>16</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Wolfe</surname> <given-names>RA</given-names></name>, <name name-style="western"><surname>McCullough</surname> <given-names>KP</given-names></name>, <name name-style="western"><surname>Schaubel</surname> <given-names>DE</given-names></name>, <name name-style="western"><surname>Kalbfleisch</surname> <given-names>JD</given-names></name>, <name name-style="western"><surname>Murray</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Stegall</surname> <given-names>MD</given-names></name>, <etal>et al</etal>. <article-title>Calculating Life Years from Transplant (LYFT): Methods for kidney and kidney-pancreas candidates</article-title>. <source>Am J Transplant</source>. <year>2008</year>;<volume>8</volume>:<fpage>997</fpage>–<lpage>1011</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.1600-6143.2008.02177.x" xlink:type="simple">10.1111/j.1600-6143.2008.02177.x</ext-link></comment> <object-id pub-id-type="pmid">18336702</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref017"><label>17</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Ishwaran</surname> <given-names>H.</given-names></name> <article-title>Variable importance in binary regression trees and forests</article-title>. <source>Electronic Journal of Statistics</source>. <year>2007</year>;<volume>1</volume>(<issue>0</issue>):<fpage>519</fpage>–<lpage>37</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1214/07-ejs039" xlink:type="simple">10.1214/07-ejs039</ext-link></comment></mixed-citation></ref>
<ref id="pone.0209068.ref018"><label>18</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Hothorn</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Lausen</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Benner</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Radespiel-Troger</surname> <given-names>M</given-names></name>. <article-title>Bagging survival trees</article-title>. <source>Stat Med</source>. <year>2004</year>;<volume>23</volume>(<issue>1</issue>):<fpage>77</fpage>–<lpage>91</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/sim.1593" xlink:type="simple">10.1002/sim.1593</ext-link></comment> <object-id pub-id-type="pmid">14695641</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref019"><label>19</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Hothorn</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Hornik</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Zeileis</surname> <given-names>A</given-names></name>. <article-title>Unbiased recursive partitioning: A conditional inference framework</article-title>. <source>J Comput Graph Stat</source>. <year>2006</year>;<volume>15</volume>(<issue>3</issue>):<fpage>651</fpage>–<lpage>74</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1198/106186006X133933" xlink:type="simple">10.1198/106186006X133933</ext-link></comment></mixed-citation></ref>
<ref id="pone.0209068.ref020"><label>20</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Strobl</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Boulesteix</surname> <given-names>A-L</given-names></name>, <name name-style="western"><surname>Zeileis</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Hothorn</surname> <given-names>T</given-names></name>. <article-title>Bias in random forest variable importance measures: Illustrations, sources and a solution</article-title>. <source>BMC Bioinformatics</source>. <year>2007</year>;<fpage>8</fpage>–<lpage>25</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1471-2105-8-8" xlink:type="simple">10.1186/1471-2105-8-8</ext-link></comment></mixed-citation></ref>
<ref id="pone.0209068.ref021"><label>21</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Kaplan</surname> <given-names>EL</given-names></name>, <name name-style="western"><surname>Meier</surname> <given-names>P</given-names></name>. <article-title>Nonparametric estimation from incomplete observations</article-title>. <source>J Am Stat Assoc</source>. <year>1958</year>;<volume>53</volume>(<issue>282</issue>):<fpage>457</fpage>–<lpage>81</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.2307/2281868" xlink:type="simple">10.2307/2281868</ext-link></comment></mixed-citation></ref>
<ref id="pone.0209068.ref022"><label>22</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Tibshirani</surname> <given-names>R.</given-names></name> <article-title>The Lasso Method for Variable Selection in the Cox Model</article-title>. <source>Stat Med</source>. <year>1997</year>;<volume>16</volume>:<fpage>385</fpage>–<lpage>95</lpage>. <object-id pub-id-type="pmid">9044528</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref023"><label>23</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Graf</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Schmoor</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Sauerbrei W</surname> <given-names>SM</given-names></name>. <article-title>Assessment and comparison of prognostic classification schemes for survival data</article-title>. <source>Stat Med</source>. <year>1999</year>;<volume>18</volume>:<fpage>2529</fpage>–<lpage>45</lpage>. <object-id pub-id-type="pmid">10474158</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref024"><label>24</label><mixed-citation publication-type="other" xlink:type="simple">R Core Team. R: A language and environment for statistical computing. 2016. Available from: <ext-link ext-link-type="uri" xlink:href="https://www.R-project.org/" xlink:type="simple">https://www.R-project.org/</ext-link>.</mixed-citation></ref>
<ref id="pone.0209068.ref025"><label>25</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Hothorn</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Buehlmann</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Dudoit</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Molinaro</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Van Der Laan</surname> <given-names>M</given-names></name>. <article-title>Survival ensembles</article-title>. <source>Biostatistics</source>. <year>2006</year>;<volume>7</volume>(<issue>3</issue>):<fpage>355</fpage>–<lpage>73</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/biostatistics/kxj011" xlink:type="simple">10.1093/biostatistics/kxj011</ext-link></comment> <object-id pub-id-type="pmid">16344280</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref026"><label>26</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Ishwaran</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Kogalur</surname> <given-names>UB</given-names></name>. <source>Random forests for survival, regression and classification (RF-SRC)</source>. <year>2016</year>. Available from: <ext-link ext-link-type="uri" xlink:href="https://cran.r-project.org/package=randomForestSRC" xlink:type="simple">https://cran.r-project.org/package=randomForestSRC</ext-link>.</mixed-citation></ref>
<ref id="pone.0209068.ref027"><label>27</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Simon</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Friedman</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Hastie</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Tibshirani</surname> <given-names>R</given-names></name>. <article-title>Regularization paths for Cox's proportional hazards model via coordinate descent</article-title>. <source>J Stat Softw</source>. <year>2011</year>;<volume>39</volume>(<issue>5</issue>):<fpage>1</fpage>–<lpage>13</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.18637/jss.v039.i05" xlink:type="simple">10.18637/jss.v039.i05</ext-link></comment> <object-id pub-id-type="pmid">27065756</object-id></mixed-citation></ref>
<ref id="pone.0209068.ref028"><label>28</label><mixed-citation publication-type="other" xlink:type="simple">Therneau TM. A package for survival analysis in S. 2015. Available from: <ext-link ext-link-type="uri" xlink:href="http://CRAN.R-project.org/package=survival" xlink:type="simple">http://CRAN.R-project.org/package=survival</ext-link>.</mixed-citation></ref>
<ref id="pone.0209068.ref029"><label>29</label><mixed-citation publication-type="other" xlink:type="simple">Harrell Jr FE. Hmisc: Harrell miscellaneous. 2016. Available from: <ext-link ext-link-type="uri" xlink:href="https://CRAN.R-project.org/package=Hmisc" xlink:type="simple">https://CRAN.R-project.org/package=Hmisc</ext-link>.</mixed-citation></ref>
<ref id="pone.0209068.ref030"><label>30</label><mixed-citation publication-type="other" xlink:type="simple">Peters A, Hothorn T. Ipred: Improved predictors. 2015. Available from: <ext-link ext-link-type="uri" xlink:href="https://CRAN.R-project.org/package=ipred" xlink:type="simple">https://CRAN.R-project.org/package=ipred</ext-link>.</mixed-citation></ref>
</ref-list>
</back>
</article>