<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id><journal-id journal-id-type="publisher-id">jmir</journal-id><journal-id journal-id-type="index">1</journal-id><journal-title>Journal of Medical Internet Research</journal-title><abbrev-journal-title>J Med Internet Res</abbrev-journal-title><issn pub-type="epub">1438-8871</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v28i1e81424</article-id><article-id pub-id-type="doi">10.2196/81424</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Time-Dynamic AI Models to Predict Quality of Life in Patients With Breast Cancer: Development and Validation Study Using the EORTC BALANCE Cohort</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Hubel</surname><given-names>Niclas J</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>van der Heijden</surname><given-names>Thijs G W</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Murauer</surname><given-names>Benjamin</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>de 
Rooij</surname><given-names>Belle H</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>de Ligt</surname><given-names>Kelly M</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Verkooijen</surname><given-names>Helena M</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Gernaat</surname><given-names>Sofie AM</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Hoedjes</surname><given-names>Meeke</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Arndt</surname><given-names>Volker</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff8">8</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>van de Poll-Franse</surname><given-names>Lonneke V</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Holzner</surname><given-names>Bernhard</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lehmann</surname><given-names>Jens</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff9">9</xref></contrib></contrib-group><aff id="aff1"><institution>Health Outcomes Research Unit, University Hospital of Psychiatry 
II, Medical University of Innsbruck</institution><addr-line>Anichstrasse 35</addr-line><addr-line>Innsbruck</addr-line><country>Austria</country></aff><aff id="aff2"><institution>Department of Psychosocial Research and Epidemiology, The Netherlands Cancer Institute</institution><addr-line>Amsterdam</addr-line><country>The Netherlands</country></aff><aff id="aff3"><institution>Evaluation Software Development GmbH</institution><addr-line>Innsbruck</addr-line><country>Austria</country></aff><aff id="aff4"><institution>Center of Research on Psychological Disorders and Somatic Diseases, Department of Medical and Clinical Psychology, Tilburg University</institution><addr-line>Tilburg</addr-line><country>The Netherlands</country></aff><aff id="aff5"><institution>Department of Research and Development, Netherlands Comprehensive Cancer Organisation (IKNL)</institution><addr-line>Utrecht</addr-line><country>The Netherlands</country></aff><aff id="aff6"><institution>Division of Imaging and Oncology, University Medical Centre Utrecht</institution><addr-line>Utrecht</addr-line><country>The Netherlands</country></aff><aff id="aff7"><institution>Center of Research on Psychological Disorders and Somatic Diseases, Department of Medical and Clinical Psychology, Tilburg University</institution><addr-line>Tilburg</addr-line><country>The Netherlands</country></aff><aff id="aff8"><institution>Cancer Survivorship Outcomes and Epidemiology, German Cancer Research Center (DKFZ)</institution><addr-line>Heidelberg</addr-line><country>Germany</country></aff><aff id="aff9"><institution>on behalf of the EORTC Quality of Life Group</institution></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Schwartz</surname><given-names>Amy</given-names></name></contrib><contrib contrib-type="editor"><name name-style="western"><surname>Balcarras</surname><given-names>Matthew</given-names></name></contrib><contrib contrib-type="editor"><name 
name-style="western"><surname>Cahill</surname><given-names>Naomi</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Bello</surname><given-names>Abdul-Waliyyu</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Shivanna</surname><given-names>Abhishek</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>zhu</surname><given-names>lichao</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Chakit</surname><given-names>Miloud</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Niclas J Hubel, MSc, Health Outcomes Research Unit, University Hospital of Psychiatry II, Medical University of Innsbruck, Anichstrasse 35, Innsbruck, 6020, Austria, 00 43 0 512 5042 3629; <email>niclas.hubel@i-med.ac.at</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>30</day><month>4</month><year>2026</year></pub-date><volume>28</volume><elocation-id>e81424</elocation-id><history><date date-type="received"><day>18</day><month>08</month><year>2025</year></date><date date-type="rev-recd"><day>04</day><month>02</month><year>2026</year></date><date date-type="accepted"><day>04</day><month>02</month><year>2026</year></date></history><copyright-statement>&#x00A9; Niclas J Hubel, Thijs G W van der Heijden, Benjamin Murauer, Belle H de Rooij, Kelly M de Ligt, Helena M Verkooijen, Sofie AM Gernaat, Meeke Hoedjes, Volker Arndt, Lonneke V van de Poll-Franse, Bernhard Holzner, Jens Lehmann. Originally published in the Journal of Medical Internet Research (<ext-link ext-link-type="uri" xlink:href="https://www.jmir.org">https://www.jmir.org</ext-link>), 30.4.2026. 
</copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.jmir.org/">https://www.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.jmir.org/2026/1/e81424"/><abstract><sec><title>Background</title><p>Patients with breast cancer often experience health-related quality of life (HRQoL) impairments that remain difficult to predict on an individual level. Prediction models can aid in understanding individual survivorship trajectories. However, current prognostic models are based on fixed intervals, limiting their utility in clinical follow-up schedules.</p></sec><sec><title>Objective</title><p>This study aimed to develop and externally validate time-dynamic machine learning (ML) models that predict clinically relevant HRQoL impairments in nonmetastatic patients with breast cancer.</p></sec><sec sec-type="methods"><title>Methods</title><p>Using the pooled multicohort EORTC (European Organisation for Research and Treatment of Cancer) BALANCE (big data in patients with breast cancer) dataset (n=6316) containing repeated HRQoL measurements (EORTC QLQ [Quality of Life Core Questionnaire]-C30), we constructed over 70,000 patient assessment pairs. 
ML algorithms were trained using the earlier HRQoL assessment and clinical data to predict dichotomized impairments in QLQ-C30 domains at the later assessment between 2 weeks and 5 years ahead, reflecting the range of follow-up intervals available in the dataset. The best performing model was determined via the area under the receiver operating characteristic curve in the internal validation, and externally validated in an independent cohort of the BALANCE dataset, in which the calibration and predictive performance in risk groups (patients: postmenopause, with financial difficulties, with obesity, with 2 or more comorbidities, with lower educational status, and with frailty) were also evaluated.</p></sec><sec sec-type="results"><title>Results</title><p>ML models showed good discrimination (area under the receiver operating characteristic curve 0.64&#x2010;0.84) across most domains, especially for persistent symptoms such as fatigue, financial difficulties, or functioning scales. Gradient boosting models performed best, but tended to be overconfident, with poor calibration for low-prevalence symptoms such as diarrhea or constipation. Model performance varied by risk group (eg, lower education and frailty), though no group consistently performed poorly. Performance remained stable across time windows, with prior HRQoL being the strongest predictor at the respective scale level, while clinical variables such as the type of treatment were less important for prediction.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Time-dynamic ML models can support personalized HRQoL prediction in breast cancer care. 
Future improvements should focus on calibration and fairness to enable equitable, clinically meaningful implementation.</p></sec></abstract><kwd-group><kwd>machine learning</kwd><kwd>health-related quality of life</kwd><kwd>HRQoL</kwd><kwd>breast cancer</kwd><kwd>prediction modeling</kwd><kwd>patient-reported outcomes</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Breast cancer remains one of the most common malignancies among women worldwide, and although survival rates have improved significantly, many patients continue to experience long-term physical, emotional, and psychosocial consequences, stemming from both the disease and its treatment [<xref ref-type="bibr" rid="ref1">1</xref>]. These effects can have a profound impact on health-related quality of life (HRQoL) across survivorship trajectories [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. Despite its clinical importance, clinicians often lack individualized insights into how HRQoL evolves across the cancer trajectory. This gap contributes to persistent unmet supportive care needs among patients with breast cancer, especially in the posttreatment phase [<xref ref-type="bibr" rid="ref4">4</xref>]. Without clear prognostic guidance on expected HRQoL changes, opportunities for patient-centered care and shared decision-making may be missed, potentially leading to suboptimal follow-up strategies and delayed interventions [<xref ref-type="bibr" rid="ref5">5</xref>].</p><p>Machine learning (ML) offers a promising avenue to address this gap when incorporating real-world data (RWD). Techniques such as deep learning and gradient boosting can uncover complex, nonlinear relationships within high-dimensional data and provide personalized HRQoL predictions [<xref ref-type="bibr" rid="ref6">6</xref>]. 
Existing ML models in breast cancer have largely focused on traditional clinical endpoints such as survival or recurrence [<xref ref-type="bibr" rid="ref7">7</xref>]. In contrast, HRQoL remains underexplored as an outcome, despite being, alongside overall survival, one of the top priorities for patients [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>].</p><p>However, several key challenges remain in applying ML to HRQoL prediction. First, structured, large-scale datasets capturing longitudinal HRQoL data are scarce [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. In addition, existing datasets are highly heterogeneous: clinical trial data, RWD, and observational studies differ substantially in structure, completeness, and context. While integrating multiple data sources may enhance generalizability, it also introduces complex challenges related to data harmonization and standardization, making analyses more difficult [<xref ref-type="bibr" rid="ref11">11</xref>].</p><p>A further limitation of most existing models is their reliance on fixed prediction intervals. Typically, HRQoL is predicted at standardized time points, such as 6 or 12 months posttreatment, without accounting for variability in patients&#x2019; assessment schedules or individual disease trajectories [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref15">15</xref>]. Yet in real-world practice, assessments often occur at irregular intervals shaped by patient needs and clinical routines. Static models thus fail to reflect the variability of patient journeys. Therefore, a time-dynamic prediction approach is warranted. 
Such a model would allow clinicians to predict HRQoL at any future point in time based on an individual&#x2019;s prior trajectory, time since last assessment, and current clinical context, supporting more timely and personalized decision-making.</p><p>Finally, ML models may inadvertently exacerbate disparities in care [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref18">18</xref>]. Demographic and socioeconomic differences in HRQoL reporting, combined with the underrepresentation of certain populations in training data, can lead to biased predictions and inequitable care [<xref ref-type="bibr" rid="ref17">17</xref>]. For example, models trained predominantly on data from phase III trials in high-income countries may underperform when applied to minority populations or patients in lower-resource settings, where symptom burden, health literacy, and reporting behaviors differ significantly [<xref ref-type="bibr" rid="ref19">19</xref>]. At present, however, it remains unclear to what extent HRQoL prediction models are affected by such biases, as empirical investigations into fairness or subgroup performance in this context are still scarce.</p><p>The present study aims to develop and validate time-dynamic ML models for predicting HRQoL in patients with nonmetastatic breast cancer from the BALANCE (big data in patients with breast cancer) cohort [<xref ref-type="bibr" rid="ref11">11</xref>]. We compare multiple ML algorithms against a baseline model and assess the impact of data heterogeneity on predictive performance. Moreover, we investigate the presence of algorithmic bias to advance fair, flexible, and clinically relevant HRQoL prediction tools for breast cancer care.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design</title><p>In this study, we developed and externally validated ML algorithms to predict clinically important impairment in HRQoL within multiple pooled datasets. 
We report our findings according to the TRIPOD (Transparent Reporting of a Multivariable Prediction Model for Individual Prognosis or Diagnosis) guidelines [<xref ref-type="bibr" rid="ref20">20</xref>] and the Guidelines for Developing and Reporting Machine Learning Predictive Models in Biomedical Research [<xref ref-type="bibr" rid="ref21">21</xref>].</p></sec><sec id="s2-2"><title>Ethical Considerations</title><p>Ethical approval for the secondary data analysis was obtained in 2022 at the Antoni van Leeuwenhoekziekenhuis/Nederlands Kanker Instituut from the institutional review board (IRBd22-179).</p><p>For the cohorts: ethical approval for the OPTIMUM (Towards Optimal Timing and Method for Promoting Sustained Adherence to Lifestyle and Body Weight Recommendations in Postmenopausal Breast Cancer Survivors) study was obtained from the Medical Research Ethics Committee Brabant, the Netherlands (NL66913.028.18). The VERDI (Verlauf der Diagnostischen Abkl&#x00E4;rung) study was approved by the ethics committees of the University of Heidelberg and the Medical Association of Saarland, Germany. Written informed consent was obtained from all participants. The study protocol for UMBRELLA (Utrecht Cohort for Multiple Breast Cancer Intervention Studies and Long-Term Evaluation) was approved by the Institutional Review and Ethics Board of the University Medical Center Utrecht, the Netherlands. No further compensation for the original participants was provided as their identity was not known to us. Patient data was processed only in pseudonymized form.</p></sec><sec id="s2-3"><title>Dataset</title><p>We described the data pooling previously in more detail [<xref ref-type="bibr" rid="ref11">11</xref>]. In brief, the BALANCE dataset comprises 6 cohorts with a total of 6316 female patients with nonmetastatic breast cancer, including trial data (EORTC [European Organisation for Research and Treatment of Cancer] AMAROS [After Mapping of the Axilla, Radiotherapy or Surgery?] 
[<xref ref-type="bibr" rid="ref22">22</xref>]), RWD (Netherlands Cancer Institute [NKI] [<xref ref-type="bibr" rid="ref23">23</xref>], district hospital Kufstein, Austria [<xref ref-type="bibr" rid="ref24">24</xref>]), and observational studies (UMBRELLA [<xref ref-type="bibr" rid="ref25">25</xref>], OPTIMUM [<xref ref-type="bibr" rid="ref26">26</xref>], and VERDI [<xref ref-type="bibr" rid="ref27">27</xref>]), with at least 2 HRQoL assessments (<xref ref-type="fig" rid="figure1">Figure 1</xref>). Data were collected between 2001 and 2024 and encompass patients receiving active treatment, follow-up, or survivorship care.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Patient flowchart. AMAROS: After Mapping of the Axilla, Radiotherapy or Surgery?; KUFSTEIN: District Hospital Kufstein cohort; NKI: Netherlands Cancer Institute; OPTIMUM: Towards Optimal Timing and Method for Promoting Sustained Adherence to Lifestyle and Body Weight Recommendations in Postmenopausal Breast Cancer Survivors; UMBRELLA: Utrecht Cohort for Multiple Breast Cancer Intervention Studies and Long-Term Evaluation; VERDI: Verlauf der Diagnostischen Abkl&#x00E4;rung.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e81424_fig01.png"/></fig></sec><sec id="s2-4"><title>Data Preparation</title><p>Data cleaning and preprocessing were conducted using R (R Foundation) [<xref ref-type="bibr" rid="ref28">28</xref>]; Jupyter Notebook and Python (Python Software Foundation) libraries (Methods S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) were used for statistical analyses and ML algorithms.</p><p>Features include patient characteristics and sociodemographics, comorbidities, disease and treatment parameters, as well as the items of the EORTC QLQ (Quality of Life Core Questionnaire)-C30 [<xref ref-type="bibr" rid="ref29">29</xref>] and breast cancer module QLQ-BR23 [<xref 
ref-type="bibr" rid="ref30">30</xref>]. Variables were either measured at the time of diagnosis or at the first HRQoL assessment. Cohort data were harmonized based on the common codebook (see Methods S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Briefly, time-related variables were coded in days since the date of diagnosis to ensure consistency across cohorts. Treatment characteristics were dichotomized into binary categories, and comorbidities were summarized as simple counts derived from available diagnostic information. Disease-related variables (eg, tumor stage and receptor status) were largely consistent across cohorts.</p><p>Features were preprocessed by one-hot encoding categorical variables (missing values were treated as distinct categories) to ensure they are represented numerically without implying an ordinal relationship and by normalizing all numeric features to 0 mean and unit variance to standardize their range, improving model performance and comparability. We removed features with 0 or near-0 variance (&#x003C;0.001) from the analysis and imputed missing feature values using the iterative imputer implementation from scikit-learn. It estimates missing values in an iterated round-robin fashion as a function of other features based on a Bayesian ridge estimator [<xref ref-type="bibr" rid="ref31">31</xref>].</p><p>To evaluate time-dynamic (ie, predicting HRQoL at every available time point using prior data and time since last assessment) predictive performance, for each patient, all possible combinations of their assessments were compiled into distinct pairs. Observations lacking either HRQoL data or the corresponding time point information were excluded. A new variable was introduced to represent the difference in days between the assessment dates within each pair. The outcome variable for each pair was defined as the value from the later assessment. 
For example (see Methods S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for an illustration), if a patient had 3 assessments, A1, A2, and A3, occurring at different time points, pairs such as (A1, A2), (A1, A3), and (A2, A3) were generated. The earlier assessment in each pair contributed its single items to the dataset, while the later assessment provided the target outcome based on the dichotomized scales (see subsection Outcomes under the Methods section). No other data from the second assessment in each pair was included in the input features. Each pair (A<sub>m</sub>, A<sub>n</sub>) is represented as a training sample (X<sub>m</sub>, t<sub>m-n</sub>, Y<sub>n</sub>), where X<sub>m</sub> are the features of the assessment m, Y<sub>n</sub> is the binary outcome variable of the respective observation, and t<sub>m-n</sub> is the time difference between A<sub>m</sub> and A<sub>n</sub> in days. Each training sample can be interpreted as &#x201C;t<sub>m-n</sub> days after the patient has reported results X<sub>m</sub>, the patient&#x2019;s outcome is Y<sub>n</sub>.&#x201D; This approach allowed us to model changes in HRQoL over time. Figure S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> shows the distribution of the time difference between assessment pairs in the train and test set.</p></sec><sec id="s2-5"><title>Outcomes</title><p>HRQoL was measured with the EORTC QLQ-C30 before, during, or after treatment. Symptom (fatigue, nausea and vomiting, pain, dyspnea, insomnia, appetite loss [AP], constipation, diarrhea, and financial difficulties) and functioning scales (physical, role, emotional, cognitive, and social) are reported on a 4-point Likert scale (&#x201C;not at all,&#x201D; &#x201C;a bit,&#x201D; &#x201C;quite a bit,&#x201D; and &#x201C;very much&#x201D;) and transformed to linear scores ranging from 0 to 100 [<xref ref-type="bibr" rid="ref32">32</xref>]. 
We dichotomized the outcomes according to the established thresholds for clinical importance to indicate clinically relevant impairments, defined as scores associated with at least one of the following patient-reported concerns: limitations in daily life, need for help or care, and worries of the patient or their partner or family [<xref ref-type="bibr" rid="ref33">33</xref>]. The dichotomization simplifies clinical interpretation through established and meaningful thresholds.</p><p>We did not adjust the dataset for class imbalance as most outcome variables were balanced (see Results section), and adjusting for class imbalance would increase the risk for overfitting.</p></sec><sec id="s2-6"><title>Algorithms</title><p>We divided our dataset into model development data (5 cohorts) and external validation data (NKI). The NKI set was chosen as it contains the most current data from clinical practice and a sufficient number of patients.</p><p>We used the scikit-learn implementations of algorithms from multiple classifier families [<xref ref-type="bibr" rid="ref34">34</xref>] that proved effective in similar studies [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. We evaluated a logistic regression with L2 regularization, an extra-trees classifier, a multilayer perceptron classifier, and a histogram-based gradient boosting classification tree (see Methods S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for a detailed description of libraries and GitHub for the code base). To account for the unequal contribution of patients with varying numbers of assessment pairs, we additionally incorporated sample weights inversely proportional to the number of pairs per patient. 
The final model was recalibrated using a probability calibration with logistic regression from scikit-learn (CalibratedClassifierCV, default settings) using a 5-fold cross-validation based on the training data. In addition, we performed post hoc recalibration on the external validation set to illustrate the extent to which context-specific adjustment can enhance model performance before deployment in a clinical setting.</p></sec><sec id="s2-7"><title>Evaluation</title><p>To assess model performance, we used internal cross-validation using a 5-fold (K=5) strategy. Given the differences in sample sizes across cohorts, the internal cross-validation was configured to keep the distribution of the cohorts within the train and test splits consistent. Thereby, the internal cross-validation was performed in a way that ensures an 80/20 train and test split and also prevents any patient overlap between train and test data.</p><p>Model performance was primarily evaluated using the area under the receiver operating characteristic curve (AUC), which is robust against class imbalance [<xref ref-type="bibr" rid="ref37">37</xref>]. Training with AUC can provide acceptable performance at a 1/10 imbalance ratio without rebalancing [<xref ref-type="bibr" rid="ref38">38</xref>]. Additional metrics included weighted <italic>F</italic><sub>1</sub>-score, accuracy, balanced accuracy, and confusion matrix metrics (sensitivity, specificity, positive predictive value, and negative predictive value) based on their scikit-learn implementation using the mean and SD from all internal cross-validation iterations [<xref ref-type="bibr" rid="ref34">34</xref>]. Accuracy reflects the overall proportion of correct predictions but can be misleading when classes are imbalanced. Balanced accuracy addresses this by averaging the recall obtained on each class, giving equal weight regardless of class frequency. 
The <italic>F</italic><sub>1</sub>-score summarizes overall classification performance by balancing false positives and false negatives, with the weighted <italic>F</italic><sub>1</sub>-score giving more weight to classes with more instances. Sensitivity (recall) quantifies the model&#x2019;s ability to correctly identify patients with an impairment, whereas specificity reflects the ability to correctly identify those without impairment. Positive predictive value indicates the probability that patients predicted to have an impairment truly experience it, while negative predictive value reflects the probability that patients predicted not to have an impairment are indeed unaffected. Higher scores indicate better overall model performance across all metrics [<xref ref-type="bibr" rid="ref39">39</xref>].</p><p>Last observation carried forward (LOCF) was used as a baseline for model comparison. LOCF serves as a straightforward method for estimating future values where patients&#x2019; HRQoL is not expected to change. These absolute values were used to compute AUC scores. LOCF has been used in clinical trials and longitudinal studies as an imputation method or to predict future HRQoL [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>]. This simple approach, therefore, provides a better baseline performance threshold than random chance (AUC=0.5). Furthermore, simplified logistic regression models with the prior HRQoL and the time difference as their only 2 predictors were computed to illustrate gains beyond LOCF.</p><p>Based on the internal cross-validation, we used the best-performing model for each target variable for external validation in the NKI dataset (<xref ref-type="fig" rid="figure1">Figure 1</xref>). 
Bootstrapping over 1000 iterations was used to estimate the stability of the external validation and LOCF, including 95% CIs [<xref ref-type="bibr" rid="ref42">42</xref>].</p><p>To interpret model predictions, we applied permutation feature importance, quantifying the contribution of each feature to the trained models. Model calibration was evaluated with calibration plots, the calibration plot&#x2019;s slope and intercept, and the expected calibration error (ECE), which assesses how closely predicted probabilities align with observed outcomes; good calibration is indicated by a calibration curve close to the diagonal, an intercept near zero, a slope approaching one, and a low ECE [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]. The ECE was based on a kernel-smoothed function using the relplot Python library [<xref ref-type="bibr" rid="ref44">44</xref>]. Additionally, the Brier score was computed to assess the overall performance, combining discrimination and calibration, with lower values near 0 representing better performance [<xref ref-type="bibr" rid="ref45">45</xref>].</p><p>Decision curve analyses were conducted to determine the clinical utility of the models [<xref ref-type="bibr" rid="ref46">46</xref>]. Predicted risks may inform patient counseling, leading to heterogeneous downstream actions, such as additional assessment, supportive care, or monitoring, which differ in burden and resource use and cannot be directly compared. Evaluating net benefit across a wide threshold range (ie, the predicted risk at which a clinician would consider acting), therefore, allows assessment of model utility under varying clinical preferences and use scenarios. In this framework, the treat-all and treat-none strategies represent reference scenarios in which all patients or no patients, respectively, are considered at risk. 
A model is considered to have clinical utility at threshold probabilities where its decision curve yields a higher net benefit than both reference strategies, indicating more favorable trade-offs between identifying patients at risk and the use of health care resources [<xref ref-type="bibr" rid="ref47">47</xref>].</p></sec><sec id="s2-8"><title>Model Fairness</title><p>In line with our aim of developing fair HRQoL prediction tools, and in accordance with recommendations to ensure equitable model performance across diverse populations [<xref ref-type="bibr" rid="ref16">16</xref>], we defined risk groups within the external validation dataset to address group fairness concerns. The following risk groups were selected based on prior literature [<xref ref-type="bibr" rid="ref48">48</xref>] and evaluated in the same manner as the full external dataset: (1) postmenopause, (2) financial difficulties (according to the thresholds for clinical importance for the financial difficulties scale [<xref ref-type="bibr" rid="ref33">33</xref>] at baseline), (3) obesity (BMI&#x2265;30), (4) 2 or more comorbidities, (5) lower educational status (secondary education or lower), and (6) frailty (scoring according to Murugappan et al [<xref ref-type="bibr" rid="ref49">49</xref>]). In addition to the previously described metrics, we evaluated true and false positive rates to screen for equalized odds disparities.</p></sec><sec id="s2-9"><title>Time-Dynamic Performance Evaluation</title><p>Further, we split the validation dataset to assess the impact of the time-dynamic aspect on model performance. As we are not relying on fixed prediction intervals, we want to ensure stable model performance across different time horizons. We evaluated long-term prediction defined as predicting outcomes more than 1 year in the future (t<sub>m-n</sub> larger than 365 days), as such predictions are especially valuable for informing survivorship care planning and long-term patient management. 
Further, we selected all outcome pairs from within the first year after diagnosis, as this period typically encompasses active treatment, during which most changes in HRQoL are expected to occur. After the first year, HRQoL tends to stabilize, making early assessment particularly relevant for capturing clinically meaningful variation [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref51">51</xref>].</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Patient Characteristics</title><p>Outcome data from 6316 patients were initially acquired. After cleaning and preprocessing, 4491 patients remained in the model development dataset (<xref ref-type="fig" rid="figure1">Figure 1</xref>). <xref ref-type="table" rid="table1">Table 1</xref> shows their main characteristics across all included datasets.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Overview of datasets and patient characteristics at baseline. 
Only valid percentages are shown.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variable</td><td align="left" valign="bottom">Overall</td><td align="left" valign="bottom">Kufstein<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td><td align="left" valign="bottom">UMBRELLA<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="bottom">OPTIMUM<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="bottom">VERDI<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="bottom">AMAROS<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup></td><td align="left" valign="bottom">NKI<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup> (external)</td></tr></thead><tbody><tr><td align="left" valign="top">Value (n)</td><td align="left" valign="top">5101</td><td align="left" valign="top">96</td><td align="left" valign="top">2580</td><td align="left" valign="top">477</td><td align="left" valign="top">224</td><td align="left" valign="top">1114</td><td align="left" valign="top">610</td></tr><tr><td align="left" valign="top">RWD<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup>, n (%)</td><td align="left" valign="top">3987 (78.2)</td><td align="left" valign="top">N/A<sup><xref ref-type="table-fn" rid="table1fn8">h</xref></sup></td><td align="left" valign="top">N/A</td><td align="left" valign="top">N/A</td><td align="left" valign="top">N/A</td><td align="left" valign="top">N/A</td><td align="left" valign="top">N/A</td></tr><tr><td align="left" valign="top">Country</td><td align="left" valign="top">N/A</td><td align="left" valign="top">Austria</td><td align="left" valign="top">Netherlands</td><td align="left" valign="top">Netherlands</td><td align="left" valign="top">Germany</td><td align="left" valign="top">Multiple<sup><xref ref-type="table-fn" rid="table1fn9">i</xref></sup></td><td 
align="left" valign="top">Netherlands</td></tr><tr><td align="left" valign="top">Assessment date in days since diagnosis, mean (SD)</td><td align="left" valign="top">265.93 (655.79)</td><td align="left" valign="top">57.02 (141.33)</td><td align="left" valign="top">361.33 (870.33)</td><td align="left" valign="top">367.07 (35.97)</td><td align="left" valign="top">667.80 (512.69)</td><td align="left" valign="top">54.51 (146.08)</td><td align="left" valign="top">54.72 (122.77)</td></tr><tr><td align="left" valign="top">Number of assessment pairs per patient, mean (SD)</td><td align="left" valign="top">4.62 (3.39)</td><td align="left" valign="top">11.6 (8.76)</td><td align="left" valign="top">5.38 (4.05)</td><td align="left" valign="top">2 (0)</td><td align="left" valign="top">2.81 (1.13)</td><td align="left" valign="top">5.30 (1.86)</td><td align="left" valign="top">2.06 (0.98)</td></tr><tr><td align="left" valign="top">Age (years), mean (SD)</td><td align="left" valign="top">56.70 (10.81)</td><td align="left" valign="top">56.83 (13.55)</td><td align="left" valign="top">55.91 (10.54)</td><td align="left" valign="top">65.33 (7.01)</td><td align="left" valign="top">56.10 (10.88)</td><td align="left" valign="top">55.94 (10.34)</td><td align="left" valign="top">54.92 (11.71)</td></tr><tr><td align="left" valign="top">Postmenopause, n (%)</td><td align="left" valign="top">1535 (67.8)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">N/A</td><td align="left" valign="top">477 (100)</td><td align="left" valign="top">154 (68.8)</td><td align="left" valign="top">648 (58.9)</td><td align="left" valign="top">247 (56.1)</td></tr><tr><td align="left" valign="top">Marital status, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Married or living together</td><td align="left" valign="top">1491 (64.2)</td><td align="left" valign="top">6 (54.5)</td><td align="left" valign="top">573 (54.5)</td><td align="left" valign="top">349 (74.7)</td><td align="left" valign="top">151 (67.4)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">412 (72)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Relationship (not married or not living together)</td><td align="left" valign="top">196 (8.4)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">134 (12.7)</td><td align="left" valign="top">17 (3.6)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">45 (7.9)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Divorced or split up</td><td align="left" valign="top">306 (13.2)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">191 (18.2)</td><td align="left" valign="top">39 (8.4)</td><td align="left" valign="top">16 (7.1)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">60 (10.5)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Widowed</td><td align="left" valign="top">193 (8.3)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">80 (7.6)</td><td align="left" valign="top">45 (9.6)</td><td align="left" valign="top">45 (20.1)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">23 (4)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Never married or lived together</td><td align="left" valign="top">137 (5.9)</td><td align="left" valign="top">3 
(27.3)</td><td align="left" valign="top">73 (6.9)</td><td align="left" valign="top">17 (3.6)</td><td align="left" valign="top">12 (5.4)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">32 (5.6)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Marital status missing</td><td align="left" valign="top">2778</td><td align="left" valign="top">87</td><td align="left" valign="top">1529</td><td align="left" valign="top">10</td><td align="left" valign="top">0</td><td align="left" valign="top">1114</td><td align="left" valign="top">38</td></tr><tr><td align="left" valign="top">Education status, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Primary education or lower</td><td align="left" valign="top">112 (3.4)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">40 (2)</td><td align="left" valign="top">6 (1.3)</td><td align="left" valign="top">61 (27.2)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">5 (0.9)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Secondary education</td><td align="left" valign="top">660 (20.2)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">490 (24.5)</td><td align="left" valign="top">98 (21)</td><td align="left" valign="top">39 (17.4)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">33 (5.7)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Vocational education</td><td align="left" valign="top">907 
(27.8)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">435 (21.8)</td><td align="left" valign="top">162 (34.7)</td><td align="left" valign="top">117 (52.2)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">193 (33.6)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>University or higher (vocational) education</td><td align="left" valign="top">1586 (48.6)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">1034 (51.7)</td><td align="left" valign="top">201 (43)</td><td align="left" valign="top">7 (3.1)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">344 (59.8)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Education status missing</td><td align="left" valign="top">1836</td><td align="left" valign="top">96</td><td align="left" valign="top">581</td><td align="left" valign="top">10</td><td align="left" valign="top">0</td><td align="left" valign="top">1114</td><td align="left" valign="top">35</td></tr><tr><td align="left" valign="top">BMI, mean (SD)</td><td align="left" valign="top">25.98 (4.46)</td><td align="left" valign="top">25.20 (4.32)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">26.05 (4.64)</td><td align="left" valign="top">26.03 (4.58)</td><td align="left" valign="top">25.94 (4.06)</td><td align="left" valign="top">26.10 (4.97)</td></tr><tr><td align="left" valign="top">Number of comorbidities, mean (SD)</td><td align="left" valign="top">1.73 (1.74)</td><td align="left" valign="top">0.33 (0.47)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">2.48 (2.02)</td><td align="left" valign="top">2.25 (1.48)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">1.13 (1.30)</td></tr><tr><td align="left" valign="top">Differentiation grade, n (%)</td><td 
align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Grade I</td><td align="left" valign="top">1176 (23.6)</td><td align="left" valign="top">7 (7.3)</td><td align="left" valign="top">668 (25.9)</td><td align="left" valign="top">102 (28.6)</td><td align="left" valign="top">17 (7.6)</td><td align="left" valign="top">276 (24.8)</td><td align="left" valign="top">106 (17.4)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Grade II</td><td align="left" valign="top">2239 (45)</td><td align="left" valign="top">39 (40.6)</td><td align="left" valign="top">1123 (43.5)</td><td align="left" valign="top">166 (46.5)</td><td align="left" valign="top">112 (50)</td><td align="left" valign="top">520 (46.7)</td><td align="left" valign="top">279 (45.7)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Grade III</td><td align="left" valign="top">1255 (25.2)</td><td align="left" valign="top">31 (32.3)</td><td align="left" valign="top">557 (21.6)</td><td align="left" valign="top">83 (23.2)</td><td align="left" valign="top">90 (40.2)</td><td align="left" valign="top">294 (26.4)</td><td align="left" valign="top">200 (32.8)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Grade IV</td><td align="left" valign="top">2 (0)</td><td align="left" valign="top">1 (1)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">1 (0.4)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td></tr><tr><td 
align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Grade unknown</td><td align="left" valign="top">307 (6.2)</td><td align="left" valign="top">17 (17.7)</td><td align="left" valign="top">232 (9)</td><td align="left" valign="top">6 (1.7)</td><td align="left" valign="top">4 (1.8)</td><td align="left" valign="top">24 (2.2)</td><td align="left" valign="top">24 (3.9)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Differentiation grade missing</td><td align="left" valign="top">120</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">120</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">TNM<sup><xref ref-type="table-fn" rid="table1fn10">j</xref></sup> stage, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0</td><td align="left" valign="top">196 (4.1)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">196 (7.7)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>IA</td><td align="left" valign="top">1903 (39.7)</td><td align="left" valign="top">27 (32.9)</td><td align="left" valign="top">1292 (51)</td><td align="left" valign="top">199 (64.6)</td><td align="left" valign="top">58 (33.9)</td><td align="left" valign="top">0 (0)</td><td 
align="left" valign="top">327 (55.2)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>IB</td><td align="left" valign="top">135 (2.8)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">135 (5.3)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>IIA</td><td align="left" valign="top">1772 (36.9)</td><td align="left" valign="top">37 (45.1)</td><td align="left" valign="top">543 (21.4)</td><td align="left" valign="top">70 (22.7)</td><td align="left" valign="top">63 (36.8)</td><td align="left" valign="top">898 (80.8)</td><td align="left" valign="top">161 (27.2)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>IIB</td><td align="left" valign="top">561 (11.7)</td><td align="left" valign="top">1 (1.2)</td><td align="left" valign="top">234 (9.2)</td><td align="left" valign="top">27 (8.8)</td><td align="left" valign="top">38 (22.2)</td><td align="left" valign="top">202 (18.2)</td><td align="left" valign="top">59 (10)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>IIIA</td><td align="left" valign="top">176 (3.7)</td><td align="left" valign="top">17 (20.7)</td><td align="left" valign="top">102 (4)</td><td align="left" valign="top">9 (2.9)</td><td align="left" valign="top">8 (4.7)</td><td align="left" valign="top">12 (1.1)</td><td align="left" valign="top">28 (4.7)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>IIIB</td><td align="left" valign="top">16 (0.3)</td><td align="left" valign="top">0 (0)</td><td 
align="left" valign="top">5 (0.2)</td><td align="left" valign="top">2 (0.6)</td><td align="left" valign="top">4 (2.3)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">5 (0.8)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>IIIC</td><td align="left" valign="top">38 (0.8)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">25 (1)</td><td align="left" valign="top">1 (0.3)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">12 (2)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>TNM stage missing</td><td align="left" valign="top">304</td><td align="left" valign="top">14</td><td align="left" valign="top">48</td><td align="left" valign="top">169</td><td align="left" valign="top">53</td><td align="left" valign="top">2</td><td align="left" valign="top">18</td></tr><tr><td align="left" valign="top">ER<sup><xref ref-type="table-fn" rid="table1fn11">k</xref></sup> positive, n (%)</td><td align="left" valign="top">3049 (82.5)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">2130 (83.5)</td><td align="left" valign="top">345 (86.7)</td><td align="left" valign="top">161 (77.8)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">413 (76.3)</td></tr><tr><td align="left" valign="top">PR<sup><xref ref-type="table-fn" rid="table1fn12">l</xref></sup> positive, n (%)</td><td align="left" valign="top">2548 (69.1)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">1828 (71.7)</td><td align="left" valign="top">260 (65.3)</td><td align="left" valign="top">148 (71.8)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">312 (58.1)</td></tr><tr><td align="left" valign="top">HER2NEU<sup><xref ref-type="table-fn" rid="table1fn13">m</xref></sup> status, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td 
align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0</td><td align="left" valign="top">2724 (59.6)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">1439 (57)</td><td align="left" valign="top">238 (60.4)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">1045 (93.9)</td><td align="left" valign="top">2 (0.4)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1+</td><td align="left" valign="top">1020 (22.3)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">739 (29.3)</td><td align="left" valign="top">126 (32)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">68 (6.1)</td><td align="left" valign="top">87 (16.1)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>2+</td><td align="left" valign="top">458 (10)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">3 (0.1)</td><td align="left" valign="top">2 (0.5)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">453 (83.6)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3+</td><td align="left" valign="top">372 (8.1)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">344 (13.6)</td><td align="left" valign="top">28 (7.1)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>HER2NEU status 
missing</td><td align="left" valign="top">527</td><td align="left" valign="top">96</td><td align="left" valign="top">55</td><td align="left" valign="top">83</td><td align="left" valign="top">224</td><td align="left" valign="top">1</td><td align="left" valign="top">68</td></tr><tr><td align="left" valign="top">Treatments, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Surgery</td><td align="left" valign="top">4985 (98.4)</td><td align="left" valign="top">49 (51)</td><td align="left" valign="top">2572 (99.7)</td><td align="left" valign="top">440 (99.3)</td><td align="left" valign="top">223 (100)</td><td align="left" valign="top">1114 (100)</td><td align="left" valign="top">587 (96.2)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Radiotherapy</td><td align="left" valign="top">4206 (85.4)</td><td align="left" valign="top">1 (1.1)</td><td align="left" valign="top">2376 (92.1)</td><td align="left" valign="top">364 (91.5)</td><td align="left" valign="top">46 (34.8)</td><td align="left" valign="top">995 (89.3)</td><td align="left" valign="top">424 (69.5)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Chemotherapy</td><td align="left" valign="top">2779 (58.4)</td><td align="left" valign="top">94 (98.9)</td><td align="left" valign="top">1196 (46.4)</td><td align="left" valign="top">121 (78.1)</td><td align="left" valign="top">75 (36.1)</td><td align="left" valign="top">706 (63.4)</td><td align="left" valign="top">281 (46.1)</td></tr><tr><td align="left" 
valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hormonal therapy</td><td align="left" valign="top">2495 (59)</td><td align="left" valign="top">1 (1.2)</td><td align="left" valign="top">1304 (50.5)</td><td align="left" valign="top">218 (86.5)</td><td align="left" valign="top">75 (37.7)</td><td align="left" valign="top">897 (80.5)</td><td align="left" valign="top">N/A</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Immunotherapy</td><td align="left" valign="top">452 (74.1)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">N/A</td><td align="left" valign="top">N/A</td><td align="left" valign="top">N/A</td><td align="left" valign="top">N/A</td><td align="left" valign="top">103 (17)</td></tr><tr><td align="left" valign="top">Frail, n (%)</td><td align="left" valign="top">346 (7.7)</td><td align="left" valign="top">9 (9.5)</td><td align="left" valign="top">293 (11.4)</td><td align="left" valign="top">16 (3.4)</td><td align="left" valign="top">3 (1.3)</td><td align="left" valign="top">25 (2.3)</td><td align="left" valign="top">33 (5.6)</td></tr><tr><td align="left" valign="top">Financial difficulties, n (%)</td><td align="left" valign="top">624 (12.2)</td><td align="left" valign="top">13 (13.5)</td><td align="left" valign="top">357 (13.8)</td><td align="left" valign="top">30 (6.3)</td><td align="left" valign="top">70 (31.2)</td><td align="left" valign="top">75 (6.7)</td><td align="left" valign="top">79 (13)</td></tr><tr><td align="left" valign="top">Obese, n (%)</td><td align="left" valign="top">291 (15.9)</td><td align="left" valign="top">13 (18.1)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">76 (16.3)</td><td align="left" valign="top">51 (23.5)</td><td align="left" valign="top">151 (14.1)</td><td align="left" valign="top">107 (19.6)</td></tr><tr><td align="left" valign="top">Two comorbidities 
or more, n (%)</td><td align="left" valign="top">444 (55.7)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">298 (62.5)</td><td align="left" valign="top">146 (65.2)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">173 (30)</td></tr><tr><td align="left" valign="top">Lower education status, n (%)</td><td align="left" valign="top">734 (27.3)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">530 (26.5)</td><td align="left" valign="top">104 (22.3)</td><td align="left" valign="top">100 (44.6)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">38 (6.6)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>Kufstein: District Hospital Kufstein cohort. </p></fn><fn id="table1fn2"><p><sup>b</sup>UMBRELLA: Utrecht Cohort for Multiple Breast Cancer Intervention Studies and Long-Term Evaluation. </p></fn><fn id="table1fn3"><p><sup>c</sup>OPTIMUM: Towards Optimal Timing and Method for Promoting Sustained Adherence to Lifestyle and Body Weight Recommendations in Postmenopausal Breast Cancer Survivors.</p></fn><fn id="table1fn4"><p><sup>d</sup>VERDI: Verlauf der Diagnostischen Abklaerung.</p></fn><fn id="table1fn5"><p><sup>e</sup>AMAROS: After Mapping of the Axilla, Radiotherapy or Surgery?</p></fn><fn id="table1fn6"><p><sup>f</sup>NKI: Netherlands Cancer Institute. </p></fn><fn id="table1fn7"><p><sup>g</sup>RWD: real world data. 
</p></fn><fn id="table1fn8"><p><sup>h</sup>N/A: not applicable.</p></fn><fn id="table1fn9"><p><sup>i</sup>France, Israel, Italy, Netherlands, Slovenia, Switzerland, Turkey, and United Kingdom.</p></fn><fn id="table1fn10"><p><sup>j</sup>TNM: tumor, nodes, metastasis.</p></fn><fn id="table1fn11"><p><sup>k</sup>ER: estrogen receptor.</p></fn><fn id="table1fn12"><p><sup>l</sup>PR: progesterone receptor.</p></fn><fn id="table1fn13"><p><sup>m</sup>HER2NEU: Human Epidermal Growth Factor Receptor 2 Neural.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Outcomes</title><p>The outcome distribution in the development and validation sets after pairing HRQoL assessments showed a higher prevalence of impairments to HRQoL in the external validation set across all domains compared to the training set (<xref ref-type="table" rid="table2">Table 2</xref>). Major class imbalance (ratio of events to the total number of assessments of less than 1/10) occurred in 3/14 scales (AP, constipation, and social functioning) in the training set. 
The event rates were higher in the external validation set.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Outcome distribution (number of assessments with respective impairments) of the EORTC QLQ-C30<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> scales in the training and validation sets.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Training set (n=69,777)</td><td align="left" valign="bottom">External validation set (n=2520)</td></tr></thead><tbody><tr><td align="left" valign="bottom">EORTC QLQ-C30 scale<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="bottom">Assessments with impairments (events)<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup>, n (%)</td><td align="left" valign="bottom">Assessments with impairments (events)<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup>, n (%)</td></tr><tr><td align="left" valign="bottom">Physical functioning (PF2)</td><td align="left" valign="bottom">18,261 (26.2)</td><td align="left" valign="bottom">754 (29.9)</td></tr><tr><td align="left" valign="bottom">Role functioning (RF2)</td><td align="left" valign="bottom">9099 (13)</td><td align="left" valign="bottom">555 (22)</td></tr><tr><td align="left" valign="bottom">Emotional functioning (EF)</td><td align="left" valign="bottom">16,046 (23)</td><td align="left" valign="bottom">1051 (41.7)</td></tr><tr><td align="left" valign="bottom">Cognitive functioning (CF)</td><td align="left" valign="bottom">20,093 (28.8)</td><td align="left" valign="bottom">942 (37.4)</td></tr><tr><td align="left" valign="bottom">Social functioning (SF)</td><td align="left" valign="bottom">5195 (7.4)</td><td align="left" valign="bottom">432 (17.1)</td></tr><tr><td align="left" valign="bottom">Fatigue (FA)</td><td align="left" valign="bottom">14,213 (20.4)</td><td align="left" valign="bottom">794 
(31.5)</td></tr><tr><td align="left" valign="top">Nausea and vomiting (NV)</td><td align="left" valign="top">9565 (13.7)</td><td align="left" valign="top">520 (20.6)</td></tr><tr><td align="left" valign="top">Pain (PA)</td><td align="left" valign="top">19,216 (27.5)</td><td align="left" valign="top">982 (39)</td></tr><tr><td align="left" valign="top">Dyspnea (DY)</td><td align="left" valign="top">19,894 (28.5)</td><td align="left" valign="top">858 (34)</td></tr><tr><td align="left" valign="top">Insomnia (SL)</td><td align="left" valign="top">12,245 (17.5)</td><td align="left" valign="top">605 (24)</td></tr><tr><td align="left" valign="top">Appetite loss (AP)</td><td align="left" valign="top">2091 (3)</td><td align="left" valign="top">124 (4.9)</td></tr><tr><td align="left" valign="top">Constipation (CO)</td><td align="left" valign="top">3414 (4.9)</td><td align="left" valign="top">156 (6.2)</td></tr><tr><td align="left" valign="top">Diarrhea (DI)</td><td align="left" valign="top">9652 (13.8)</td><td align="left" valign="top">559 (22.2)</td></tr><tr><td align="left" valign="top">Financial difficulties (FI)</td><td align="left" valign="top">7833 (11.2)</td><td align="left" valign="top">435 (17.3)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>EORTC QLQ-C30: European Organisation for Research and Treatment of Cancer Quality of Life Questionnaire Core 30.</p></fn><fn id="table2fn2"><p><sup>b</sup>The global health status scale was not analyzed as there is no published threshold available.</p></fn><fn id="table2fn3"><p><sup>c</sup>Events defined as scores below the thresholds for clinical importance indicate clinically relevant impairments according to Giesinger et al [<xref ref-type="bibr" rid="ref33">33</xref>].</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-3"><title>Model Development and Internal Validation</title><p><xref ref-type="fig" rid="figure2">Figure 2A</xref> illustrates the performance of the logistic regression, 
extra-trees classifier, multilayer perceptron classifier, and a histogram-based gradient boosting classification tree for the prediction of impaired HRQoL at the next available assessment. Across all evaluated QLQ-C30 domains, the histogram-based gradient boosting classification tree showed the highest AUC, and all algorithms outperformed the LOCF baseline (<xref ref-type="fig" rid="figure2">Figure 2B</xref>). AUC values for the baseline regression models lay between 0.648 (95% CI 0.616&#x2010;0.679; pain) and 0.829 (95% CI 0.767&#x2010;0.884; AP); see <xref ref-type="fig" rid="figure2">Figure 2B</xref> for a comparison. A comprehensive list of evaluation metrics can be found in Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><p>Among all QLQ-C30 domains, functional scales had a higher AUC than single-item symptom scales (dyspnea, insomnia, AP, constipation, and diarrhea), except for financial difficulties, which showed the highest AUC overall (0.861, SD 0.009).</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Evaluation of models trained to predict impairments in HRQoL. Error bars: SD, for LOCF and external validation: 95% CI. Full data available in Tables S1 and S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. HRQoL: health-related quality of life; LOCF: last observation carried forward; ROC AUC: area under the receiver operating characteristic curve.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e81424_fig02.png"/></fig></sec><sec id="s3-4"><title>External Validation</title><p>The external validation with the NKI yielded good discriminatory ability (<xref ref-type="fig" rid="figure2">Figure 2B</xref> and Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). 
The highest AUC (0.837, 95% CI 0.809&#x2010;0.864) could be observed in the financial difficulties scale, whereas the diarrhea scale yielded the lowest AUC (0.643, 95% CI 0.600&#x2010;0.689).</p><p>Model calibration varied between the scales (Figure S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). We observed the worst calibration in the single-item symptom scales (AP, constipation, and diarrhea), better calibration in the functioning scales, and the best calibration in fatigue and physical functioning. Generally, models for scales containing more items were better calibrated. Calibration slopes were below the ideal value of 1 for all models (Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), ranging from 0.089 (constipation; 95% CI 0.063&#x2010;0.116) to 0.286 (fatigue; 95% CI 0.259&#x2010;0.313), indicating overconfident predictions. Post hoc recalibration improved discrimination (AUCs 0.975&#x2010;0.995) as well as calibration based on visual inspection (Table S5 and Figure S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><p>Across all domain models, the individual HRQoL items from the previous assessment, the time of assessment, and treatment start dates were among the most important features (Figure S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). 
The type of treatment, other clinical variables, and diagnostic characteristics or comorbidities had little influence on the models&#x2019; performance.</p><p>Decision curves are shown in Figure S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, and most models (exceptions: social functioning, AP, and diarrhea) proved superior to a &#x201C;treat all&#x201D; scenario for risk thresholds between 0.2 and 0.6.</p></sec><sec id="s3-5"><title>Model Fairness</title><p>The proportion of events in the risk groups was almost always higher than in the external validation set (Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). <xref ref-type="fig" rid="figure3">Figure 3A</xref> illustrates model performance in risk groups selected from the external validation set in comparison with the whole set (see Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for risk group distributions).</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Model performance in risk groups and time-dynamic performance compared to the external validation. For (B) after diagnosis: all assessments within the first year after diagnosis; future assessment: all assessments more than 1 year in the future. Full data available in Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. ROC AUC: area under the receiver operating characteristic curve.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e81424_fig03.png"/></fig><p>The discrimination power within risk groups varied between domains, depending on specific risk group-scale combinations (Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). 
The lower educational status risk group showed the highest (financial difficulties: 0.897, 95% CI 0.825&#x2010;0.956) as well as the lowest (nausea and vomiting: 0.473, 95% CI 0.314&#x2010;0.633) AUC overall.</p><p>In the postmenopausal and obese risk groups, AUC CIs consistently overlapped with those of the full dataset, indicating similar model performance. This was largely consistent for other risk groups, except for the following cases: multiple comorbidities (pain and dyspnea), financial difficulties, frailty (AP and role functioning), and lower educational status (nausea and vomiting, and constipation), where reduced performance was observed.</p><p>Additionally, the predictive performance differed within some scales more than in others. For instance, in the pain scale, the AUCs were relatively homogeneous, whereas the constipation scale had a high variability in AUCs. Model calibration was poor with calibration slopes across all targets and risk groups below the ideal value of 1 (Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Due to the low number of events, we could not evaluate the calibration plots.</p></sec><sec id="s3-6"><title>Time-Dynamic Performance</title><p>We observed little impact of the time-dynamic aspect on model performance (<xref ref-type="fig" rid="figure3">Figure 3B</xref>). The prediction within the first year after diagnosis showed similar AUCs compared to the whole external dataset, with differences below 0.01 (Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). 
Long-term prediction showed slightly higher AUCs in 9 of 14 cases and the greatest deterioration in role functioning (0.032).</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This study developed the first time-dynamic ML model for predicting impaired HRQoL in patients with early breast cancer, using multiple cohorts from different countries and settings. The ML-based prediction models consistently outperformed LOCF and the regression baseline in 10 of 14 cases, with the histogram-based gradient boosting classification tree showing the best performance. The best calibration was seen in multi-item scales; however, predictions were overconfident in all domains. We introduce a novel approach to time-dynamic HRQoL prediction, enabling flexible predictions beyond fixed time points. This addresses the issue with current static models, as they cannot capture the variability of real-world HRQoL assessment schedules. It therefore allows the early detection of meaningful HRQoL impairments throughout a patient&#x2019;s course of disease and provides clinicians with a tool to guide targeted interventions. Model fairness analyses revealed variation in model performance across risk groups, depending on individual domain and group combinations.</p></sec><sec id="s4-2"><title>Model Evaluation and External Validation</title><p>Overall, our models demonstrated good discriminatory performance across most HRQoL domains; however, calibration was inconsistent, particularly for scales with low outcome prevalence. Discrimination, reflected in AUC values exceeding 0.75 [<xref ref-type="bibr" rid="ref52">52</xref>], was generally strong, confirming that the models effectively distinguished between patients with impaired HRQoL and those without. 
This is within the range of comparable studies, most of which used internal k-fold cross-validation (see Krepper et al [<xref ref-type="bibr" rid="ref12">12</xref>] for an overview). Yet, for some outcomes (especially AP, constipation, and diarrhea) predicted probabilities did not consistently align with observed event rates (ie, poor calibration), limiting the clinical reliability of the models in those domains.</p><p>Accurate predictions, based on both strong discrimination and acceptable calibration, were observed for key domains such as physical, emotional, and cognitive functioning, as well as fatigue, pain, and financial difficulties. These domains might reflect more persistent problems, likely contributing to the robustness of the predictive models [<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref54">54</xref>]. In contrast, models struggled to predict transient or low-prevalence symptoms, including diarrhea, nausea and vomiting, and constipation. These limitations reflect both the nature of the symptoms, often short-lived and influenced by acute factors [<xref ref-type="bibr" rid="ref55">55</xref>], and the statistical challenges of modeling rare outcomes [<xref ref-type="bibr" rid="ref39">39</xref>]. The poor calibration in these domains can be attributed to the class imbalance and the insufficient total number of events. In our external dataset, some of these outcomes (AP and constipation) occurred fewer than 200 times, a known threshold below which reliable calibration curves become difficult to estimate [<xref ref-type="bibr" rid="ref43">43</xref>], while also corresponding to less than 10% of all observations. Here, ensemble methods such as random forests and gradient boosting tend to struggle, often underestimating probabilities at the extremes due to their inherent smoothing behavior [<xref ref-type="bibr" rid="ref56">56</xref>]. 
This happens because averaging predictions from many noisy base models pulls extreme values toward the center, making it difficult to produce confident predictions near 0 or 1.</p><p>To address these limitations, we recalibrated the models using data from the specific clinical setting where they could be applied, thereby adjusting for local outcome prevalence and population characteristics. We highlighted the impact of this approach in a supplementary analysis, which improved model performance drastically.</p><p>Another potential approach is upsampling the training data to balance class distributions, which showed improved calibration when using HRQoL to predict clinical events [<xref ref-type="bibr" rid="ref36">36</xref>]. However, this does not reflect real-world incidence rates and may distort probability calibration without improving model performance in cases with an adequate number of events. Notably, similar challenges have been reported in other HRQoL modeling efforts: for example, Adiprakoso et al [<xref ref-type="bibr" rid="ref35">35</xref>] observed good discrimination but suboptimal calibration when predicting fatigue in patients with cancer, reinforcing the need for careful evaluation of both performance dimensions.</p><p>Despite these issues, this study adds to the growing body of literature emphasizing the value of external validation, a step still rarely undertaken in HRQoL modeling despite TRIPOD guidelines recommending distinct datasets for model evaluation [<xref ref-type="bibr" rid="ref20">20</xref>].</p><p>In line with previous research [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref57">57</xref>-<xref ref-type="bibr" rid="ref59">59</xref>], prior HRQoL was consistently among the most important predictors across all models, even over longer periods of time. Temporal variables, such as treatment start and stop dates and the timing of HRQoL assessment, also ranked highly. 
This was also reflected in the competitive performance of the baseline model, which included only prior HRQoL and the time between assessments. In contrast, neither specific treatment types nor clinical variables (eg, tumor stage) appeared influential for predicting the general functioning and symptom domains of the QLQ-C30. This suggests that, for broad HRQoL outcomes, being on or off treatment may matter more than which specific treatment is received. These patterns may differ for treatment-specific side effects not captured by the QLQ-C30 (eg, skin problems for new targeted agents), highlighting an avenue for future studies using more granular or treatment-targeted patient-reported outcome (PRO) measures [<xref ref-type="bibr" rid="ref60">60</xref>].</p><p>Decision curve analysis indicated that most models provided greater net benefit than treat-all and treat-none strategies across threshold probabilities between 0.2 and 0.6, suggesting potential clinical usefulness within this range. As subsequent actions following risk identification are not clearly defined and may vary widely (see Di Meglio et al [<xref ref-type="bibr" rid="ref57">57</xref>] for a list of suggested interventions for patients with high risk of fatigue), the models should not be interpreted as directly guiding specific interventions. Rather, given that available options are often low risk and primarily involve the use of supportive resources, the models&#x2019; main value may lie in informing patient counseling and facilitating early, shared discussions about potential support needs.</p></sec><sec id="s4-3"><title>Model Fairness and Time-Dynamic Performance</title><p>Model fairness analyses revealed disparities in model performance, notably among patients with lower educational status or frailty. However, there was no single risk group that consistently showed the worst discrimination across all domains. 
Our findings echo concerns about algorithmic bias in health care ML models, exacerbating existing inequities in socioeconomic status, disability, and other characteristics [<xref ref-type="bibr" rid="ref61">61</xref>-<xref ref-type="bibr" rid="ref63">63</xref>]. This was reflected in the increased prevalence of impaired HRQoL across the selected risk groups, which nevertheless could not always be predicted correctly. Addressing these risks requires the use of fairness-aware ML techniques, such as reweighting, adversarial debiasing, or subgroup-specific calibration, to ensure equitable performance across diverse patient populations [<xref ref-type="bibr" rid="ref17">17</xref>]. Future work should explore these strategies to prevent the amplification of health care disparities.</p><p>Our implementation of time-dynamic prediction marks a promising methodological extension over traditional fixed-interval ML models for HRQoL. Enabled by a heterogeneous dataset, this approach better reflects real-world clinical care, where follow-up intervals vary. Importantly, we observed consistent model performance across different time spans. For long-term prediction, that is, spanning more than 1 year between assessments, this might reflect a stabilization of HRQoL. At the same time, the models also performed well during the first year after diagnosis, despite this period being marked by significant treatment-related fluctuations in HRQoL. This indicates that the models are capable of capturing both stable and dynamic phases of a patient&#x2019;s trajectory, making them applicable in both contexts. 
In line with the ESMO (European Society for Medical Oncology) clinical practice guideline for PRO use in clinical practice, which recommends integrating PRO results into clinical care [<xref ref-type="bibr" rid="ref64">64</xref>], such insights may inform supportive care planning by enabling the prioritization of patients who are likely to require timely interventions, while also helping patients develop more realistic expectations regarding their long-term HRQoL prognosis.</p><p>As our approach primarily served as a proof-of-concept, no direct comparisons with existing HRQoL models are currently available. Nevertheless, these encouraging results highlight the potential of time-dynamic modeling to address real-world clinical needs, warranting extension to other populations and settings. Future research is needed to compare this approach to static models.</p></sec><sec id="s4-4"><title>Strengths and Limitations</title><p>This study presents several key strengths. To our knowledge, it is the first ML approach to HRQoL prediction that incorporates time-dynamic modeling for patients with breast cancer, allowing for predictions at variable future time points rather than fixed intervals. Second, deriving our outcomes directly from anchor-based thresholds (patients reporting limitations in daily life, need for help or care, or worries of the patient or their partner or family) [<xref ref-type="bibr" rid="ref33">33</xref>] ensures that predictions are tied to clinically meaningful impairments. As such, the models can help identify which patients are more likely to develop problems in specific HRQoL domains at selected points in the future and who may benefit from further clinical attention. 
Considering that PRO data are increasingly collected in routine care and that the QLQ-C30 is among the most frequently used questionnaires in electronic systems [<xref ref-type="bibr" rid="ref65">65</xref>], our study shows that these data could be used more comprehensively to inform clinical teams and patients. Additionally, the use of a multicohort dataset, combining clinical trial data with real-world observational data, improves the model&#x2019;s validity. Importantly, we performed external validation using a separate cohort to evaluate generalizability and illustrated the effects of post hoc recalibration. We also explicitly assessed predictive fairness, addressing a critical and often overlooked aspect of ML in health care by examining performance across subgroups and discussing bias mitigation strategies.</p><p>Nevertheless, this study has limitations. Most patients in our dataset were Dutch, which may limit the generalizability of findings to other countries. However, reference values for patients with early breast cancer demonstrate only slight variations across Europe [<xref ref-type="bibr" rid="ref66">66</xref>], and the models primarily rely on prior HRQoL rather than population-specific variables. This might suggest that their performance is not inherently tied to national context, and the models may be transferable to other similar countries, provided that health care systems, cultural backgrounds, and follow-up intensity are broadly comparable. Yet, model adoption into different settings must still be evaluated carefully. 
In addition, we are currently working to include further German and British data to expand our database and retrain our models with a more international population.</p><p>Second, even though we evaluated model performance in an RWD set and this might have reduced selection bias, there might still be an underrepresentation of certain minorities or risk groups in our data.</p><p>Furthermore, as we performed a secondary analysis on existing datasets not originally intended for this purpose, some potentially important predictors of HRQoL (eg, socioeconomic status or social support) were unavailable, which may have limited the performance of our models.</p><p>Additionally, we dichotomized the outcomes to facilitate clinical interpretation; this may have led to a loss of information and reduced predictive accuracy compared to modeling with the original continuous scale.</p><p>Further, the field of ML is evolving rapidly, and by the time results are published, newer architectures (eg, pretrained tabular foundation models [<xref ref-type="bibr" rid="ref67">67</xref>]) may already offer improved performance. Exploring such approaches was beyond the scope of this study but represents an important direction for future research.</p><p>Finally, while our models demonstrate promise, they remain preliminary with respect to clinical implementation, especially for a few selected scales showing poor calibration for certain rare symptoms. 
This limitation may be attributable not only to low event rates but also to the application of a single time-dynamic modeling framework across heterogeneous phases of the patient journey, raising the possibility that more phase-specific approaches (eg, during active treatment vs posttreatment or survivorship) could improve calibration for certain symptoms.</p><p>This mirrors a systemic issue in translational implementation, where HRQoL prediction models often fail to progress beyond proof-of-concept due to a combination of technical, operational, and contextual barriers [<xref ref-type="bibr" rid="ref68">68</xref>]. As outlined by Spencer et al [<xref ref-type="bibr" rid="ref69">69</xref>], both general ML deployment issues and PRO-specific challenges contribute to what they refer to as the &#x201C;leaky pipeline&#x201D; from model development to bedside application. Moreover, compliance with regulatory frameworks, such as the European Union Artificial Intelligence Act, necessitates not only robust prospective validation in real-world settings but also demonstrable alignment with ethical, safety, and stakeholder-involvement standards.</p></sec><sec id="s4-5"><title>Conclusions</title><p>Our findings support the future integration of ML into PRO-based clinical decision support systems, while also emphasizing the need to address fairness in predictive modeling. Importantly, the predicted impairments are clinically meaningful, as they identify patients at risk of future problems derived from anchor-based thresholds and enable more timely, targeted interventions. The time-dynamic nature of the predictions further increases their clinical utility by allowing risk estimation to be aligned with clinically relevant time horizons rather than fixed follow-up intervals. 
Future work should focus on improving model fairness, expanding dataset diversity, and evaluating clinical implementation in real-world oncology settings.</p></sec></sec></body><back><ack><p>We would like to acknowledge that the following members of the EORTC Quality of Life Group were involved in this work: Niclas J Hubel, Thijs G W van der Heijden, Belle H de Rooij, Kelly M de Ligt, Lonneke V van de Poll-Franse, Bernhard Holzner, Jens Lehmann.</p><p>We would like to thank Corneel Coens, PhD, for his help with identifying EORTC (European Organisation for Research and Treatment of Cancer) breast cancer trials; Pablo Reja, PhD, for all his advice surrounding data sharing agreements and creating a draft data sharing agreement for us; Coralie Poncet, MSc, for preparing the EORTC AMAROS (After Mapping of the Axilla, Radiotherapy or Surgery?) data for this project; the NKI (Netherlands Cancer Institute) Scientific data administration, especially Melanie Singer-Van den Hout, MSc, for their data preparation of the NKI data; Henrike Bretveld, MSc, and Ghita Puts, MSc, from the Dutch cancer registry for clinical data preparation of UMBRELLA (Utrecht Cohort for Multiple Breast Cancer Intervention Studies and Long-Term Evaluation) and OPTIMUM (Towards Optimal Timing and Method for Promoting Sustained Adherence to Lifestyle and Body Weight Recommendations in Postmenopausal Breast Cancer Survivors); Nicole Horevoorts, MSc and the team of the PROFILES (Patient Reported Outcomes Following Initial Treatment and Long term Evaluation of Survivorship) registry for the health-related quality of life data preparation of UMBRELLA and OPTIMUM; the team research from the UMCU (University Medical Center Utrecht) division of imaging for providing the key to couple NKR (Netherlands Cancer Registry) and PROFILES data for UMBRELLA; August Zabernigg, MD from BKH Kufstein (District Hospital Kufstein) for providing the BKH Kufstein data; the NKI knowledge transfer and contracting 
department for all the help with the data-sharing agreements; Lonneke van de Poll-Franse, PhD, Jaap C Seidell, PhD, Floortje Mols, MD, Sandra van Cappellen-van Maldegem, MSc, Janneke van den Boom, BA, and Judith van Valenberg, MSc, for the execution of the OPTIMUM study.</p><p>Disclosure of delegation to generative artificial intelligence (GenAI): The authors declare the use of generative AI in the research and writing process. According to the GAIDeT (Generative Artificial Intelligence Delegation Taxonomy; 2025), the following tasks were delegated to GenAI tools under full human supervision: (1) code optimization, (2) proofreading and editing, and (3) summarizing text. The GenAI tool used was ChatGPT-5 (OpenAI). Responsibility for this final paper lies entirely with the authors. GenAI tools are not listed as authors and do not bear responsibility for the outcomes. Declaration submitted by collective responsibility.</p></ack><notes><sec><title>Funding</title><p>This research was funded by the European Organisation for Research and Treatment of Cancer (EORTC) Quality of Life Group (007-2022; EORTC 2052). The funder had no involvement in this study&#x2019;s design, data collection, analysis, interpretation, or the writing of this paper.</p></sec><sec><title>Data Availability</title><p>The data supporting this study&#x2019;s findings are available from each cohort study&#x2019;s principal investigator. Restrictions apply to the availability of these data, which were used under license for this study. 
The code of our analyses can be accessed through GitHub [<xref ref-type="bibr" rid="ref70">70</xref>].</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: NJH, EORTC Quality of Life Group</p><p>Data curation: NJH, TGWvdH, EORTC Quality of Life Group</p><p>Formal analysis: NJH, BM, EORTC Quality of Life Group</p><p>Investigation: NJH, TGWvdH, EORTC Quality of Life Group</p><p>Methodology: NJH, BM, EORTC Quality of Life Group</p><p>Project administration: NJH, TGWvdH, EORTC Quality of Life Group</p><p>Resources: LVvdP-F, BH, EORTC Quality of Life Group</p><p>Supervision: LVvdP-F, BH, JL, EORTC Quality of Life Group</p><p>Writing &#x2013; original draft: NJH, BM, JL, EORTC Quality of Life Group</p><p>Writing &#x2013; review &#x0026; editing: NJH, TGWvdH, BM, BHdR, KMdL, HMV, MH, VA, LVvdP-F, BH, JL, EORTC Quality of Life Group</p><p>Data provision: KMdL, HMV, MH, VA, EORTC Quality of Life Group</p></fn><fn fn-type="conflict"><p>NJH reports employment by ACMIT GmbH - Austrian Center for Medical Innovation and Technology, Wiener Neustadt, Austria, outside the submitted work.</p><p>HMV reports research funding by Philips, Elekta, European Commission, Dutch Research Council, and Dutch Cancer Foundation outside of the submitted work.</p><p>BH holds shares in the company Evaluation Software Development GmbH, Innsbruck, Austria. 
JL reports consultancy for Evaluation Software Development and a research grant from Takeda, both outside of the submitted work.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AMAROS</term><def><p>After Mapping of the Axilla, Radiotherapy or Surgery?</p></def></def-item><def-item><term id="abb2">AP</term><def><p>appetite loss</p></def></def-item><def-item><term id="abb3">AUC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb4">BALANCE</term><def><p>big data in patients with breast cancer</p></def></def-item><def-item><term id="abb5">ECE</term><def><p>expected calibration error</p></def></def-item><def-item><term id="abb6">EORTC</term><def><p>European Organisation for Research and Treatment of Cancer</p></def></def-item><def-item><term id="abb7">ER</term><def><p>estrogen receptor</p></def></def-item><def-item><term id="abb8">ESMO</term><def><p>European Society for Medical Oncology</p></def></def-item><def-item><term id="abb9">HRQoL</term><def><p>health-related quality of life</p></def></def-item><def-item><term id="abb10">LOCF</term><def><p>last observation carried forward</p></def></def-item><def-item><term id="abb11">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb12">NKI</term><def><p>Netherlands Cancer Institute</p></def></def-item><def-item><term id="abb13">OPTIMUM</term><def><p>Towards Optimal Timing and Method for Promoting Sustained Adherence to Lifestyle and Body Weight Recommendations in Postmenopausal Breast Cancer Survivors</p></def></def-item><def-item><term id="abb14">PRO</term><def><p>patient-reported outcome</p></def></def-item><def-item><term id="abb15">QLQ</term><def><p>Quality of Life Questionnaire</p></def></def-item><def-item><term id="abb16">RWD</term><def><p>real-world data</p></def></def-item><def-item><term id="abb17">TRIPOD</term><def><p>Transparent Reporting of a Multivariable Prediction Model for 
Individual Prognosis or Diagnosis</p></def></def-item><def-item><term id="abb18">UMBRELLA</term><def><p>Utrecht Cohort for Multiple Breast Cancer Intervention Studies and Long-Term Evaluation</p></def></def-item><def-item><term id="abb19">VERDI</term><def><p>Verlauf der Diagnostischen Abkl&#x00E4;rung</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Harbeck</surname><given-names>N</given-names> </name><name name-style="western"><surname>Gnant</surname><given-names>M</given-names> </name></person-group><article-title>Breast cancer</article-title><source>Lancet</source><year>2017</year><month>03</month><day>18</day><volume>389</volume><issue>10074</issue><fpage>1134</fpage><lpage>1150</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(16)31891-8</pub-id><pub-id pub-id-type="medline">27865536</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Anderson-Hanley</surname><given-names>C</given-names> </name><name name-style="western"><surname>Sherman</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Riggs</surname><given-names>R</given-names> </name><name name-style="western"><surname>Agocha</surname><given-names>VB</given-names> </name><name name-style="western"><surname>Compas</surname><given-names>BE</given-names> </name></person-group><article-title>Neuropsychological effects of treatments for adults with cancer: a meta-analysis and review of the literature</article-title><source>J Int Neuropsychol Soc</source><year>2003</year><month>11</month><volume>9</volume><issue>7</issue><fpage>967</fpage><lpage>982</lpage><pub-id pub-id-type="doi">10.1017/S1355617703970019</pub-id><pub-id pub-id-type="medline">14738279</pub-id></nlm-citation></ref><ref 
id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mokhtari-Hessari</surname><given-names>P</given-names> </name><name name-style="western"><surname>Montazeri</surname><given-names>A</given-names> </name></person-group><article-title>Health-related quality of life in breast cancer patients: review of reviews from 2008 to 2018</article-title><source>Health Qual Life Outcomes</source><year>2020</year><month>12</month><volume>18</volume><issue>1</issue><fpage>1</fpage><lpage>25</lpage><pub-id pub-id-type="doi">10.1186/s12955-020-01591-x</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>von Heymann-Horan</surname><given-names>AB</given-names> </name><name name-style="western"><surname>Dalton</surname><given-names>SO</given-names> </name><name name-style="western"><surname>Dziekanska</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Unmet needs of women with breast cancer during and after primary treatment: a prospective study in Denmark</article-title><source>Acta Oncol</source><year>2013</year><month>02</month><volume>52</volume><issue>2</issue><fpage>382</fpage><lpage>390</lpage><pub-id pub-id-type="doi">10.3109/0284186X.2012.746468</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alfano</surname><given-names>CM</given-names> </name><name name-style="western"><surname>Mayer</surname><given-names>DK</given-names> </name><name name-style="western"><surname>Bhatia</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Implementing personalized pathways for cancer follow&#x2010;up care in the United States: proceedings from an American Cancer Society&#x2013;American Society of 
Clinical Oncology summit</article-title><source>CA Cancer J Clin</source><year>2019</year><month>05</month><volume>69</volume><issue>3</issue><fpage>234</fpage><lpage>247</lpage><pub-id pub-id-type="doi">10.3322/caac.21558</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Karri</surname><given-names>R</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>YPP</given-names> </name><name name-style="western"><surname>Drummond</surname><given-names>KJ</given-names> </name></person-group><article-title>Using machine learning to predict health-related quality of life outcomes in patients with low grade glioma, meningioma, and acoustic neuroma</article-title><source>PLoS ONE</source><year>2022</year><volume>17</volume><issue>5</issue><fpage>e0267931</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0267931</pub-id><pub-id pub-id-type="medline">35507629</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>van der Heijden</surname><given-names>TGW</given-names> </name><name name-style="western"><surname>de Ligt</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Hubel</surname><given-names>NJ</given-names> </name><etal/></person-group><article-title>Exploring the role of health-related quality of life measures in predictive modelling for oncology: a systematic review</article-title><source>Qual Life Res</source><year>2025</year><month>02</month><volume>34</volume><issue>2</issue><fpage>305</fpage><lpage>323</lpage><pub-id pub-id-type="doi">10.1007/s11136-024-03820-y</pub-id><pub-id pub-id-type="medline">39652111</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Mertz</surname><given-names>S</given-names> </name><name name-style="western"><surname>Benjamin</surname><given-names>C</given-names> </name><name name-style="western"><surname>Girvalaki</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Progression-free survival and quality of life in metastatic breast cancer: the patient perspective</article-title><source>Breast</source><year>2022</year><month>10</month><volume>65</volume><fpage>84</fpage><lpage>90</lpage><pub-id pub-id-type="doi">10.1016/j.breast.2022.07.006</pub-id><pub-id pub-id-type="medline">35870420</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yeo</surname><given-names>HY</given-names> </name><name name-style="western"><surname>Liew</surname><given-names>AC</given-names> </name><name name-style="western"><surname>Chan</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Anwar</surname><given-names>M</given-names> </name><name name-style="western"><surname>Han</surname><given-names>CHW</given-names> </name><name name-style="western"><surname>Marra</surname><given-names>CA</given-names> </name></person-group><article-title>Understanding patient preferences regarding the important determinants of breast cancer treatment: a narrative scoping review</article-title><source>Patient Prefer Adherence</source><year>2023</year><volume>17</volume><fpage>2679</fpage><lpage>2706</lpage><pub-id pub-id-type="doi">10.2147/PPA.S432821</pub-id><pub-id pub-id-type="medline">37927344</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Riley</surname><given-names>RD</given-names> </name><name name-style="western"><surname>Ensor</surname><given-names>J</given-names> </name><name 
name-style="western"><surname>Snell</surname><given-names>KIE</given-names> </name><etal/></person-group><article-title>Calculating the sample size required for developing a clinical prediction model</article-title><source>BMJ</source><year>2020</year><month>03</month><day>18</day><volume>368</volume><fpage>m441</fpage><pub-id pub-id-type="doi">10.1136/bmj.m441</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>van der Heijden</surname><given-names>TGW</given-names> </name><name name-style="western"><surname>Hubel</surname><given-names>NJ</given-names> </name><name name-style="western"><surname>de Ligt</surname><given-names>KM</given-names> </name><etal/></person-group><article-title>Opportunities and challenges in pooling health-related quality-of-life data for prediction modeling in breast cancer across Europe: lessons from the EORTC BALANCE project</article-title><source>ESMO Real World Data Digit Oncol</source><year>2025</year><month>09</month><volume>9</volume><fpage>100172</fpage><pub-id pub-id-type="doi">10.1016/j.esmorw.2025.100172</pub-id><pub-id pub-id-type="medline">41646212</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Krepper</surname><given-names>D</given-names> </name><name name-style="western"><surname>Cesari</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hubel</surname><given-names>NJ</given-names> </name><name name-style="western"><surname>Zelger</surname><given-names>P</given-names> </name><name name-style="western"><surname>Sztankay</surname><given-names>MJ</given-names> </name></person-group><article-title>Machine learning models including patient-reported outcome data in oncology: a systematic literature review and analysis of their reporting 
quality</article-title><source>J Patient Rep Outcomes</source><year>2024</year><month>11</month><day>5</day><volume>8</volume><issue>1</issue><fpage>126</fpage><pub-id pub-id-type="doi">10.1186/s41687-024-00808-7</pub-id><pub-id pub-id-type="medline">39499409</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pfob</surname><given-names>A</given-names> </name><name name-style="western"><surname>Mehrara</surname><given-names>BJ</given-names> </name><name name-style="western"><surname>Nelson</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Wilkins</surname><given-names>EG</given-names> </name><name name-style="western"><surname>Pusic</surname><given-names>AL</given-names> </name><name name-style="western"><surname>Sidey-Gibbons</surname><given-names>C</given-names> </name></person-group><article-title>Machine learning to predict individual patient-reported outcomes at 2-year follow-up for women undergoing cancer-related mastectomy and breast reconstruction (INSPiRED-001)</article-title><source>Breast</source><year>2021</year><month>12</month><volume>60</volume><fpage>111</fpage><lpage>122</lpage><pub-id pub-id-type="doi">10.1016/j.breast.2021.09.009</pub-id><pub-id pub-id-type="medline">34619573</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shi</surname><given-names>HY</given-names> </name><name name-style="western"><surname>Tsai</surname><given-names>JT</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>YM</given-names> </name><name name-style="western"><surname>Culbertson</surname><given-names>R</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>HT</given-names> </name><name 
name-style="western"><surname>Hou</surname><given-names>MF</given-names> </name></person-group><article-title>Predicting two-year quality of life after breast cancer surgery using artificial neural network and linear regression models</article-title><source>Breast Cancer Res Treat</source><year>2012</year><month>08</month><volume>135</volume><issue>1</issue><fpage>221</fpage><lpage>229</lpage><pub-id pub-id-type="doi">10.1007/s10549-012-2174-6</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sharifi</surname><given-names>F</given-names> </name><name name-style="western"><surname>Mohammed</surname><given-names>E</given-names> </name><name name-style="western"><surname>Crump</surname><given-names>T</given-names> </name><name name-style="western"><surname>Far</surname><given-names>BH</given-names> </name></person-group><article-title>Explainable analytics to predict the quality of life in patients with prostate cancer from longitudinal data</article-title><source>Appl Artif Intell</source><year>2022</year><month>12</month><day>31</day><volume>36</volume><issue>1</issue><fpage>2055393</fpage><pub-id pub-id-type="doi">10.1080/08839514.2022.2055393</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Castelnovo</surname><given-names>A</given-names> </name><name name-style="western"><surname>Crupi</surname><given-names>R</given-names> </name><name name-style="western"><surname>Greco</surname><given-names>G</given-names> </name><name name-style="western"><surname>Regoli</surname><given-names>D</given-names> </name><name name-style="western"><surname>Penco</surname><given-names>IG</given-names> </name><name name-style="western"><surname>Cosentini</surname><given-names>AC</given-names> </name></person-group><article-title>A 
clarification of the nuances in the fairness metrics landscape</article-title><source>Sci Rep</source><year>2022</year><month>03</month><day>10</day><volume>12</volume><issue>1</issue><fpage>4209</fpage><pub-id pub-id-type="doi">10.1038/s41598-022-07939-1</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mehrabi</surname><given-names>N</given-names> </name><name name-style="western"><surname>Morstatter</surname><given-names>F</given-names> </name><name name-style="western"><surname>Saxena</surname><given-names>N</given-names> </name><name name-style="western"><surname>Lerman</surname><given-names>K</given-names> </name><name name-style="western"><surname>Galstyan</surname><given-names>A</given-names> </name></person-group><article-title>A survey on bias and fairness in machine learning</article-title><source>ACM Comput Surv</source><year>2022</year><month>07</month><day>31</day><volume>54</volume><issue>6</issue><fpage>1</fpage><lpage>35</lpage><pub-id pub-id-type="doi">10.1145/3457607</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rajkomar</surname><given-names>A</given-names> </name><name name-style="western"><surname>Hardt</surname><given-names>M</given-names> </name><name name-style="western"><surname>Howell</surname><given-names>MD</given-names> </name><name name-style="western"><surname>Corrado</surname><given-names>G</given-names> </name><name name-style="western"><surname>Chin</surname><given-names>MH</given-names> </name></person-group><article-title>Ensuring fairness in machine learning to advance health equity</article-title><source>Ann Intern Med</source><year>2018</year><month>12</month><day>18</day><volume>169</volume><issue>12</issue><fpage>866</fpage><lpage>872</lpage><pub-id 
pub-id-type="doi">10.7326/M18-1990</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Lara</surname><given-names>PN</given-names> </name><name name-style="western"><surname>Dang</surname><given-names>JHT</given-names> </name><name name-style="western"><surname>Paterniti</surname><given-names>DA</given-names> </name><name name-style="western"><surname>Kelly</surname><given-names>K</given-names> </name></person-group><article-title>Twenty years post-NIH Revitalization Act: Enhancing Minority Participation in Clinical Trials (EMPaCT): laying the groundwork for improving minority clinical trial accrual: renewing the case for enhancing minority participation in cancer clinical trials</article-title><source>Cancer</source><year>2014</year><month>04</month><day>1</day><volume>120</volume><issue>7</issue><supplement>Suppl 7</supplement><fpage>1091</fpage><lpage>1096</lpage><pub-id pub-id-type="doi">10.1002/cncr.28575</pub-id><pub-id pub-id-type="medline">24643646</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Collins</surname><given-names>GS</given-names> </name><name name-style="western"><surname>Moons</surname><given-names>KGM</given-names> </name><name name-style="western"><surname>Dhiman</surname><given-names>P</given-names> </name><etal/></person-group><article-title>TRIPOD+AI statement: updated guidance for reporting clinical prediction models that use regression or machine learning methods</article-title><source>BMJ</source><year>2024</year><month>04</month><day>16</day><volume>385</volume><fpage>e078378</fpage><pub-id pub-id-type="doi">10.1136/bmj-2023-078378</pub-id><pub-id pub-id-type="medline">38626948</pub-id></nlm-citation></ref><ref 
id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Luo</surname><given-names>W</given-names> </name><name name-style="western"><surname>Phung</surname><given-names>D</given-names> </name><name name-style="western"><surname>Tran</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Guidelines for developing and reporting machine learning predictive models in biomedical research: a multidisciplinary view</article-title><source>J Med Internet Res</source><year>2016</year><month>12</month><day>16</day><volume>18</volume><issue>12</issue><fpage>e323</fpage><pub-id pub-id-type="doi">10.2196/jmir.5870</pub-id><pub-id pub-id-type="medline">27986644</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Straver</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Meijnen</surname><given-names>P</given-names> </name><name name-style="western"><surname>van Tienhoven</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Sentinel node identification rate and nodal involvement in the EORTC 10981-22023 AMAROS trial</article-title><source>Ann Surg Oncol</source><year>2010</year><month>07</month><volume>17</volume><issue>7</issue><fpage>1854</fpage><lpage>1861</lpage><pub-id pub-id-type="doi">10.1245/s10434-010-0945-z</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Boomstra</surname><given-names>E</given-names> </name><name name-style="western"><surname>Walraven</surname><given-names>I</given-names> </name><name name-style="western"><surname>van der Ploeg</surname><given-names>IMC</given-names> </name><etal/></person-group><article-title>Moving beyond barriers: 
a mixed-method study to develop evidence-based strategies to improve implementation of PROMs in clinical oncology care</article-title><source>Qual Life Res</source><year>2025</year><month>01</month><volume>34</volume><issue>1</issue><fpage>173</fpage><lpage>188</lpage><pub-id pub-id-type="doi">10.1007/s11136-024-03787-w</pub-id><pub-id pub-id-type="medline">39302555</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wintner</surname><given-names>LM</given-names> </name><name name-style="western"><surname>Giesinger</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Sztankay</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bottomley</surname><given-names>A</given-names> </name><name name-style="western"><surname>Holzner</surname><given-names>B</given-names> </name><collab>EORTC Quality of Life Group</collab></person-group><article-title>Evaluating the use of the EORTC patient-reported outcome measures for improving inter-rater reliability of CTCAE ratings in a mixed population of cancer patients: study protocol for a randomized controlled trial</article-title><source>Trials</source><year>2020</year><month>10</month><day>13</day><volume>21</volume><issue>1</issue><fpage>849</fpage><pub-id pub-id-type="doi">10.1186/s13063-020-04745-w</pub-id><pub-id pub-id-type="medline">33050917</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Young-Afat</surname><given-names>DA</given-names> </name><name name-style="western"><surname>van Gils</surname><given-names>CH</given-names> </name><name name-style="western"><surname>van den Bongard</surname><given-names>HJGD</given-names> </name><name name-style="western"><surname>Verkooijen</surname><given-names>HM</given-names> 
</name><collab>on behalf of the UMBRELLA Study Group</collab></person-group><article-title>The Utrecht Cohort for Multiple Breast Cancer Intervention Studies and Long-Term Evaluation (UMBRELLA): objectives, design, and baseline results</article-title><source>Breast Cancer Res Treat</source><year>2017</year><month>07</month><volume>164</volume><issue>2</issue><fpage>445</fpage><lpage>450</lpage><pub-id pub-id-type="doi">10.1007/s10549-017-4242-4</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>van Cappellen-van Maldegem</surname><given-names>SJM</given-names> </name><name name-style="western"><surname>Mols</surname><given-names>F</given-names> </name><name name-style="western"><surname>Horevoorts</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Towards Optimal Timing and Method for Promoting Sustained Adherence to Lifestyle and Body Weight Recommendations in Postmenopausal Breast Cancer Survivors (the OPTIMUM-study): protocol for a longitudinal mixed-method study</article-title><source>BMC Womens Health</source><year>2021</year><month>07</month><day>6</day><volume>21</volume><issue>1</issue><fpage>268</fpage><pub-id pub-id-type="doi">10.1186/s12905-021-01406-1</pub-id><pub-id pub-id-type="medline">34229690</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arndt</surname><given-names>V</given-names> </name><name name-style="western"><surname>St&#x00FC;rmer</surname><given-names>T</given-names> </name><name name-style="western"><surname>Stegmaier</surname><given-names>C</given-names> </name><name name-style="western"><surname>Ziegler</surname><given-names>H</given-names> </name><name name-style="western"><surname>Dhom</surname><given-names>G</given-names> </name><name 
name-style="western"><surname>Brenner</surname><given-names>H</given-names> </name></person-group><article-title>Socio-demographic factors, health behavior and late-stage diagnosis of breast cancer in Germany: a population-based study</article-title><source>J Clin Epidemiol</source><year>2001</year><month>07</month><volume>54</volume><issue>7</issue><fpage>719</fpage><lpage>727</lpage><pub-id pub-id-type="doi">10.1016/s0895-4356(00)00351-6</pub-id><pub-id pub-id-type="medline">11438413</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="web"><source>R Foundation for Statistical Computing</source><access-date>2026-04-14</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.R-project.org/">https://www.R-project.org/</ext-link></comment></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Aaronson</surname><given-names>NK</given-names> </name><name name-style="western"><surname>Ahmedzai</surname><given-names>S</given-names> </name><name name-style="western"><surname>Bergman</surname><given-names>B</given-names> </name><etal/></person-group><article-title>The European Organization for Research and Treatment of Cancer QLQ-C30: a quality-of-life instrument for use in international clinical trials in oncology</article-title><source>J Natl Cancer Inst</source><year>1993</year><month>03</month><day>3</day><volume>85</volume><issue>5</issue><fpage>365</fpage><lpage>376</lpage><pub-id pub-id-type="doi">10.1093/jnci/85.5.365</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sprangers</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Groenvold</surname><given-names>M</given-names> </name><name 
name-style="western"><surname>Arraras</surname><given-names>JI</given-names> </name><etal/></person-group><article-title>The European Organization for Research and Treatment of Cancer breast cancer-specific quality-of-life questionnaire module: first results from a three-country field study</article-title><source>J Clin Oncol</source><year>1996</year><month>10</month><volume>14</volume><issue>10</issue><fpage>2756</fpage><lpage>2768</lpage><pub-id pub-id-type="doi">10.1200/JCO.1996.14.10.2756</pub-id><pub-id pub-id-type="medline">8874337</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="web"><article-title>IterativeImputer</article-title><source>scikit-learn</source><access-date>2026-04-14</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://scikit-learn.org/stable/modules/generated/sklearn.impute.IterativeImputer.html">https://scikit-learn.org/stable/modules/generated/sklearn.impute.IterativeImputer.html</ext-link></comment></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="report"><person-group person-group-type="author"><name name-style="western"><surname>Fayers</surname><given-names>PM</given-names> </name><name name-style="western"><surname>Aaronson</surname><given-names>NK</given-names> </name><name name-style="western"><surname>Bjordal</surname><given-names>K</given-names> </name><etal/></person-group><article-title>The EORTC QLQ-C30 scoring manual (3rd edition)</article-title><source>European Organisation for Research and Treatment of Cancer, Brussels</source><year>2001</year><access-date>2026-04-18</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.eortc.org/app/uploads/sites/2/2018/02/SCmanual.pdf">https://www.eortc.org/app/uploads/sites/2/2018/02/SCmanual.pdf</ext-link></comment></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Giesinger</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Loth</surname><given-names>FLC</given-names> </name><name name-style="western"><surname>Aaronson</surname><given-names>NK</given-names> </name><etal/></person-group><article-title>Thresholds for clinical importance were established to improve interpretation of the EORTC QLQ-C30 in clinical practice and research</article-title><source>J Clin Epidemiol</source><year>2020</year><month>02</month><volume>118</volume><fpage>1</fpage><lpage>8</lpage><pub-id pub-id-type="doi">10.1016/j.jclinepi.2019.10.003</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pedregosa</surname><given-names>F</given-names> </name><name name-style="western"><surname>Varoquaux</surname><given-names>G</given-names> </name><name name-style="western"><surname>Gramfort</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Scikit-learn: machine learning in Python</article-title><source>J Mach Learn Res</source><year>2011</year><access-date>2026-04-14</access-date><volume>12</volume><issue>85</issue><fpage>2825</fpage><lpage>2830</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://jmlr.org/papers/volume12/pedregosa11a/pedregosa11a.pdf">https://jmlr.org/papers/volume12/pedregosa11a/pedregosa11a.pdf</ext-link></comment></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Adiprakoso</surname><given-names>D</given-names> </name><name name-style="western"><surname>Katsimpokis</surname><given-names>D</given-names> </name><name name-style="western"><surname>Oerlemans</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Development of a prediction model for clinically-relevant 
fatigue: a multi-cancer approach</article-title><source>Qual Life Res</source><year>2025</year><month>01</month><volume>34</volume><issue>1</issue><fpage>231</fpage><lpage>245</lpage><pub-id pub-id-type="doi">10.1007/s11136-024-03807-9</pub-id><pub-id pub-id-type="medline">39516438</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>W&#x00F3;jcik</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Dimitrova</surname><given-names>V</given-names> </name><name name-style="western"><surname>Warrington</surname><given-names>L</given-names> </name><name name-style="western"><surname>Velikova</surname><given-names>G</given-names> </name><name name-style="western"><surname>Absolom</surname><given-names>K</given-names> </name></person-group><article-title>Using machine learning to predict unplanned hospital utilization and chemotherapy management from patient-reported outcome measures</article-title><source>JCO Clin Cancer Inform</source><year>2024</year><month>04</month><volume>8</volume><fpage>e2300264</fpage><pub-id pub-id-type="doi">10.1200/CCI.23.00264</pub-id><pub-id pub-id-type="medline">38669610</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bradley</surname><given-names>AP</given-names> </name></person-group><article-title>The use of the area under the ROC curve in the evaluation of machine learning algorithms</article-title><source>Pattern Recognit</source><year>1997</year><month>07</month><volume>30</volume><issue>7</issue><fpage>1145</fpage><lpage>1159</lpage><pub-id pub-id-type="doi">10.1016/S0031-3203(96)00142-2</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Megahed</surname><given-names>FM</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>YJ</given-names> </name><name name-style="western"><surname>Megahed</surname><given-names>A</given-names> </name><name name-style="western"><surname>Ong</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Altman</surname><given-names>N</given-names> </name><name name-style="western"><surname>Krzywinski</surname><given-names>M</given-names> </name></person-group><article-title>The class imbalance problem</article-title><source>Nat Methods</source><year>2021</year><month>11</month><volume>18</volume><issue>11</issue><fpage>1270</fpage><lpage>1272</lpage><pub-id pub-id-type="doi">10.1038/s41592-021-01302-4</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Steyerberg</surname><given-names>EW</given-names> </name></person-group><source>Clinical Prediction Models: A Practical Approach to Development, Validation, and Updating</source><year>2019</year><publisher-loc>Cham</publisher-loc><publisher-name>Springer</publisher-name><pub-id pub-id-type="doi">10.1007/978-3-030-16399-0</pub-id><pub-id pub-id-type="other">978-3-030-16398-3</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Karahalios</surname><given-names>A</given-names> </name><name name-style="western"><surname>Baglietto</surname><given-names>L</given-names> </name><name name-style="western"><surname>Carlin</surname><given-names>JB</given-names> </name><name name-style="western"><surname>English</surname><given-names>DR</given-names> </name><name name-style="western"><surname>Simpson</surname><given-names>JA</given-names> </name></person-group><article-title>A review of the reporting and handling of missing data in cohort 
studies with repeated assessment of exposure measures</article-title><source>BMC Med Res Methodol</source><year>2012</year><month>07</month><day>11</day><volume>12</volume><issue>1</issue><fpage>96</fpage><pub-id pub-id-type="doi">10.1186/1471-2288-12-96</pub-id><pub-id pub-id-type="medline">22784200</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Leyrat</surname><given-names>C</given-names> </name><name name-style="western"><surname>Carpenter</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Bailly</surname><given-names>S</given-names> </name><name name-style="western"><surname>Williamson</surname><given-names>EJ</given-names> </name></person-group><article-title>Common methods for handling missing data in marginal structural models: what works and why</article-title><source>Am J Epidemiol</source><year>2021</year><month>04</month><day>6</day><volume>190</volume><issue>4</issue><fpage>663</fpage><lpage>672</lpage><pub-id pub-id-type="doi">10.1093/aje/kwaa225</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Steyerberg</surname><given-names>EW</given-names> </name><name name-style="western"><surname>Harrell</surname><given-names>FE</given-names><suffix>Jr</suffix> </name></person-group><article-title>Prediction models need appropriate internal, internal-external, and external validation</article-title><source>J Clin Epidemiol</source><year>2016</year><month>01</month><volume>69</volume><fpage>245</fpage><lpage>247</lpage><pub-id pub-id-type="doi">10.1016/j.jclinepi.2015.04.005</pub-id><pub-id pub-id-type="medline">25981519</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Van Calster</surname><given-names>B</given-names> </name><name name-style="western"><surname>McLernon</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>van Smeden</surname><given-names>M</given-names> </name><name name-style="western"><surname>Wynants</surname><given-names>L</given-names> </name><name name-style="western"><surname>Steyerberg</surname><given-names>EW</given-names> </name><collab>Topic Group &#x2018;Evaluating diagnostic tests and prediction models&#x2019; of the STRATOS initiative</collab></person-group><article-title>Calibration: the Achilles heel of predictive analytics</article-title><source>BMC Med</source><year>2019</year><month>12</month><day>16</day><volume>17</volume><issue>1</issue><fpage>230</fpage><pub-id pub-id-type="doi">10.1186/s12916-019-1466-7</pub-id><pub-id pub-id-type="medline">31842878</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>B&#x0142;asiok</surname><given-names>J</given-names> </name><name name-style="western"><surname>Nakkiran</surname><given-names>P</given-names> </name></person-group><article-title>Smooth ECE: principled reliability diagrams via kernel smoothing</article-title><source>arXiv</source><comment>Preprint posted online on Sep 21, 2023</comment><pub-id pub-id-type="doi">10.48550/ARXIV.2309.12236</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Brier</surname><given-names>GW</given-names> </name></person-group><article-title>Verification of forecasts expressed in terms of probability</article-title><source>Mon Weather Rev</source><year>1950</year><month>01</month><volume>78</volume><issue>1</issue><fpage>1</fpage><lpage>3</lpage><pub-id 
pub-id-type="doi">10.1175/1520-0493(1950)078&#x003C;0001:VOFEIT&#x003E;2.0.CO;2</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vickers</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Elkin</surname><given-names>EB</given-names> </name></person-group><article-title>Decision curve analysis: a novel method for evaluating prediction models</article-title><source>Med Decis Making</source><year>2006</year><volume>26</volume><issue>6</issue><fpage>565</fpage><lpage>574</lpage><pub-id pub-id-type="doi">10.1177/0272989X06295361</pub-id><pub-id pub-id-type="medline">17099194</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Van Calster</surname><given-names>B</given-names> </name><name name-style="western"><surname>Wynants</surname><given-names>L</given-names> </name><name name-style="western"><surname>Verbeek</surname><given-names>JFM</given-names> </name><etal/></person-group><article-title>Reporting and interpreting decision curve analysis: a guide for investigators</article-title><source>Eur Urol</source><year>2018</year><month>12</month><volume>74</volume><issue>6</issue><fpage>796</fpage><lpage>804</lpage><pub-id pub-id-type="doi">10.1016/j.eururo.2018.08.038</pub-id><pub-id pub-id-type="medline">30241973</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tack</surname><given-names>L</given-names> </name><name name-style="western"><surname>Schofield</surname><given-names>P</given-names> </name><name name-style="western"><surname>Boterberg</surname><given-names>T</given-names> </name><name 
name-style="western"><surname>Parris</surname><given-names>CN</given-names> </name><name name-style="western"><surname>Debruyne</surname><given-names>PR</given-names> </name></person-group><article-title>Editorial: clinical cancer research in vulnerable populations</article-title><source>Front Oncol</source><year>2023</year><volume>13</volume><fpage>1166714</fpage><pub-id pub-id-type="doi">10.3389/fonc.2023.1166714</pub-id><pub-id pub-id-type="medline">36937380</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Murugappan</surname><given-names>MN</given-names> </name><name name-style="western"><surname>King-Kallimanis</surname><given-names>BL</given-names> </name><name name-style="western"><surname>Bhatnagar</surname><given-names>V</given-names> </name><etal/></person-group><article-title>Patient-Reported Frailty Phenotype (PRFP) vs. International Myeloma Working Group frailty index (IMWG FI) proxy: a comparison between two approaches to measuring frailty</article-title><source>J Geriatr Oncol</source><year>2024</year><month>03</month><volume>15</volume><issue>2</issue><fpage>101681</fpage><pub-id pub-id-type="doi">10.1016/j.jgo.2023.101681</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gao</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Rosas</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Fink</surname><given-names>H</given-names> </name><name name-style="western"><surname>Behrens</surname><given-names>S</given-names> </name><name name-style="western"><surname>Chang-Claude</surname><given-names>J</given-names> </name><name name-style="western"><surname>Seibold</surname><given-names>P</given-names> </name></person-group><article-title>Longitudinal 
changes of health-related quality of life over 10 years in breast cancer patients treated with radiotherapy following breast-conserving surgery</article-title><source>Qual Life Res</source><year>2023</year><month>09</month><volume>32</volume><issue>9</issue><fpage>2639</fpage><lpage>2652</lpage><pub-id pub-id-type="doi">10.1007/s11136-023-03408-y</pub-id><pub-id pub-id-type="medline">37093543</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hsu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Ennis</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hood</surname><given-names>N</given-names> </name><name name-style="western"><surname>Graham</surname><given-names>M</given-names> </name><name name-style="western"><surname>Goodwin</surname><given-names>PJ</given-names> </name></person-group><article-title>Quality of life in long-term breast cancer survivors</article-title><source>J Clin Oncol</source><year>2013</year><month>10</month><day>1</day><volume>31</volume><issue>28</issue><fpage>3540</fpage><lpage>3548</lpage><pub-id pub-id-type="doi">10.1200/JCO.2012.48.1903</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>de Hond</surname><given-names>AAH</given-names> </name><name name-style="western"><surname>Steyerberg</surname><given-names>EW</given-names> </name><name name-style="western"><surname>Van Calster</surname><given-names>B</given-names> </name></person-group><article-title>Interpreting area under the receiver operating characteristic curve</article-title><source>Lancet Digit Health</source><year>2022</year><month>12</month><volume>4</volume><issue>12</issue><fpage>e853</fpage><lpage>e855</lpage><pub-id 
pub-id-type="doi">10.1016/S2589-7500(22)00188-1</pub-id><pub-id pub-id-type="medline">36270955</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bower</surname><given-names>JE</given-names> </name></person-group><article-title>Behavioral symptoms in patients with breast cancer and survivors</article-title><source>J Clin Oncol</source><year>2008</year><month>02</month><day>10</day><volume>26</volume><issue>5</issue><fpage>768</fpage><lpage>777</lpage><pub-id pub-id-type="doi">10.1200/JCO.2007.14.3248</pub-id><pub-id pub-id-type="medline">18258985</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Maass</surname><given-names>SWMC</given-names> </name><name name-style="western"><surname>Brandenbarg</surname><given-names>D</given-names> </name><name name-style="western"><surname>Boerman</surname><given-names>LM</given-names> </name><name name-style="western"><surname>Verhaak</surname><given-names>PFM</given-names> </name><name name-style="western"><surname>de Bock</surname><given-names>GH</given-names> </name><name name-style="western"><surname>Berendsen</surname><given-names>AJ</given-names> </name></person-group><article-title>Fatigue among long-term breast cancer survivors: a controlled cross-sectional study</article-title><source>Cancers (Basel)</source><year>2021</year><month>03</month><day>15</day><volume>13</volume><issue>6</issue><fpage>1301</fpage><pub-id pub-id-type="doi">10.3390/cancers13061301</pub-id><pub-id pub-id-type="medline">33803966</pub-id></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Greenlee</surname><given-names>H</given-names> </name><name 
name-style="western"><surname>DuPont-Reyes</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Balneaves</surname><given-names>LG</given-names> </name><etal/></person-group><article-title>Clinical practice guidelines on the evidence-based use of integrative therapies during and after breast cancer treatment</article-title><source>CA Cancer J Clin</source><year>2017</year><month>05</month><day>6</day><volume>67</volume><issue>3</issue><fpage>194</fpage><lpage>232</lpage><pub-id pub-id-type="doi">10.3322/caac.21397</pub-id><pub-id pub-id-type="medline">28436999</pub-id></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Niculescu-Mizil</surname><given-names>A</given-names> </name><name name-style="western"><surname>Caruana</surname><given-names>R</given-names> </name></person-group><article-title>Predicting good probabilities with supervised learning</article-title><source>Proceedings of the 22nd International Conference on Machine Learning (ICML '05)</source><year>2005</year><fpage>625</fpage><lpage>632</lpage><pub-id pub-id-type="doi">10.1145/1102351.1102430</pub-id></nlm-citation></ref><ref id="ref57"><label>57</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Di Meglio</surname><given-names>A</given-names> </name><name name-style="western"><surname>Havas</surname><given-names>J</given-names> </name><name name-style="western"><surname>Soldato</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Development and validation of a predictive model of severe fatigue after breast cancer diagnosis: toward a personalized framework in survivorship care</article-title><source>J Clin Oncol</source><year>2022</year><month>04</month><day>1</day><volume>40</volume><issue>10</issue><fpage>1111</fpage><lpage>1123</lpage><pub-id pub-id-type="doi">10.1200/JCO.21.01252</pub-id></nlm-citation></ref><ref 
id="ref58"><label>58</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>R&#x00E9;v&#x00E9;sz</surname><given-names>D</given-names> </name><name name-style="western"><surname>van Kuijk</surname><given-names>SMJ</given-names> </name><name name-style="western"><surname>Mols</surname><given-names>F</given-names> </name><etal/></person-group><article-title>Development and internal validation of prediction models for colorectal cancer survivors to estimate the 1-year risk of low health-related quality of life in multiple domains</article-title><source>BMC Med Inform Decis Mak</source><year>2020</year><month>03</month><day>12</day><volume>20</volume><issue>1</issue><fpage>54</fpage><pub-id pub-id-type="doi">10.1186/s12911-020-1064-9</pub-id><pub-id pub-id-type="medline">32164641</pub-id></nlm-citation></ref><ref id="ref59"><label>59</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>C</given-names> </name><name name-style="western"><surname>Pfob</surname><given-names>A</given-names> </name><name name-style="western"><surname>Mehrara</surname><given-names>BJ</given-names> </name><etal/></person-group><article-title>Enhanced surgical decision-making tools in breast cancer: predicting 2-year postoperative physical, sexual, and psychosocial well-being following mastectomy and breast reconstruction (INSPiRED 004)</article-title><source>Ann Surg Oncol</source><year>2023</year><month>11</month><volume>30</volume><issue>12</issue><fpage>7046</fpage><lpage>7059</lpage><pub-id pub-id-type="doi">10.1245/s10434-023-13971-w</pub-id><pub-id pub-id-type="medline">37516723</pub-id></nlm-citation></ref><ref id="ref60"><label>60</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bjelic-Radisic</surname><given-names>V</given-names> </name><name 
name-style="western"><surname>Cardoso</surname><given-names>F</given-names> </name><name name-style="western"><surname>Cameron</surname><given-names>D</given-names> </name><etal/></person-group><article-title>An international update of the EORTC questionnaire for assessing quality of life in breast cancer patients: EORTC QLQ-BR45</article-title><source>Ann Oncol</source><year>2020</year><month>02</month><volume>31</volume><issue>2</issue><fpage>283</fpage><lpage>288</lpage><pub-id pub-id-type="doi">10.1016/j.annonc.2019.10.027</pub-id><pub-id pub-id-type="medline">31959345</pub-id></nlm-citation></ref><ref id="ref61"><label>61</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mittermaier</surname><given-names>M</given-names> </name><name name-style="western"><surname>Raza</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Kvedar</surname><given-names>JC</given-names> </name></person-group><article-title>Bias in AI-based models for medical applications: challenges and mitigation strategies</article-title><source>NPJ Digit Med</source><year>2023</year><month>06</month><day>14</day><volume>6</volume><issue>1</issue><fpage>113</fpage><pub-id pub-id-type="doi">10.1038/s41746-023-00858-z</pub-id><pub-id pub-id-type="medline">37311802</pub-id></nlm-citation></ref><ref id="ref62"><label>62</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cross</surname><given-names>JL</given-names> </name><name name-style="western"><surname>Choma</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Onofrey</surname><given-names>JA</given-names> </name></person-group><article-title>Bias in medical AI: implications for clinical decision-making</article-title><source>PLOS Digit Health</source><year>2024</year><month>11</month><volume>3</volume><issue>11</issue><fpage>e0000651</fpage><pub-id 
pub-id-type="doi">10.1371/journal.pdig.0000651</pub-id><pub-id pub-id-type="medline">39509461</pub-id></nlm-citation></ref><ref id="ref63"><label>63</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Whitehead</surname><given-names>M</given-names> </name><name name-style="western"><surname>Carrol</surname><given-names>E</given-names> </name><name name-style="western"><surname>Kee</surname><given-names>F</given-names> </name><name name-style="western"><surname>Holmes</surname><given-names>C</given-names> </name></person-group><article-title>Making the invisible visible: what can we do about biased AI in medical devices?</article-title><source>BMJ</source><year>2023</year><month>08</month><day>16</day><volume>382</volume><fpage>1893</fpage><pub-id pub-id-type="doi">10.1136/bmj.p1893</pub-id></nlm-citation></ref><ref id="ref64"><label>64</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Di Maio</surname><given-names>M</given-names> </name><name name-style="western"><surname>Basch</surname><given-names>E</given-names> </name><name name-style="western"><surname>Denis</surname><given-names>F</given-names> </name><etal/></person-group><article-title>The role of patient-reported outcome measures in the continuum of cancer clinical care: ESMO clinical practice guideline</article-title><source>Ann Oncol</source><year>2022</year><month>09</month><volume>33</volume><issue>9</issue><fpage>878</fpage><lpage>892</lpage><pub-id pub-id-type="doi">10.1016/j.annonc.2022.04.007</pub-id><pub-id pub-id-type="medline">35462007</pub-id></nlm-citation></ref><ref id="ref65"><label>65</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hubel</surname><given-names>NJ</given-names> </name><name name-style="western"><surname>Vorbach</surname><given-names>SM</given-names> </name><name 
name-style="western"><surname>de Ligt</surname><given-names>KM</given-names> </name><etal/></person-group><article-title>Sustainability and time trends in electronic patient-reported outcome assessment in routine cancer care: systematic scoping review and follow-up survey</article-title><source>J Med Internet Res</source><year>2025</year><month>04</month><day>25</day><volume>27</volume><issue>1</issue><fpage>e69398</fpage><pub-id pub-id-type="doi">10.2196/69398</pub-id><pub-id pub-id-type="medline">40280556</pub-id></nlm-citation></ref><ref id="ref66"><label>66</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mierzynska</surname><given-names>J</given-names> </name><name name-style="western"><surname>Taye</surname><given-names>M</given-names> </name><name name-style="western"><surname>Pe</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Reference values for the EORTC QLQ-C30 in early and metastatic breast cancer</article-title><source>Eur J Cancer</source><year>2020</year><month>01</month><volume>125</volume><fpage>69</fpage><lpage>82</lpage><pub-id pub-id-type="doi">10.1016/j.ejca.2019.10.031</pub-id><pub-id pub-id-type="medline">31838407</pub-id></nlm-citation></ref><ref id="ref67"><label>67</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hollmann</surname><given-names>N</given-names> </name><name name-style="western"><surname>M&#x00FC;ller</surname><given-names>S</given-names> </name><name name-style="western"><surname>Purucker</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Accurate predictions on small data with a tabular foundation model</article-title><source>Nature</source><year>2025</year><month>01</month><day>9</day><volume>637</volume><issue>8045</issue><fpage>319</fpage><lpage>326</lpage><pub-id 
pub-id-type="doi">10.1038/s41586-024-08328-6</pub-id></nlm-citation></ref><ref id="ref68"><label>68</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>TC</given-names> </name><name name-style="western"><surname>Shah</surname><given-names>NU</given-names> </name><name name-style="western"><surname>Haack</surname><given-names>A</given-names> </name><name name-style="western"><surname>Baxter</surname><given-names>SL</given-names> </name></person-group><article-title>Clinical implementation of predictive models embedded within electronic health record systems: a systematic review</article-title><source>Informatics (MDPI)</source><year>2020</year><month>09</month><volume>7</volume><issue>3</issue><fpage>25</fpage><pub-id pub-id-type="doi">10.3390/informatics7030025</pub-id></nlm-citation></ref><ref id="ref69"><label>69</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Spencer</surname><given-names>KL</given-names> </name><name name-style="western"><surname>Absolom</surname><given-names>KL</given-names> </name><name name-style="western"><surname>Allsop</surname><given-names>MJ</given-names> </name><etal/></person-group><article-title>Fixing the leaky pipe: how to improve the uptake of patient-reported outcomes-based prognostic and predictive models in cancer clinical practice</article-title><source>JCO Clin Cancer Inform</source><year>2023</year><month>09</month><volume>7</volume><issue>7</issue><fpage>e2300070</fpage><pub-id pub-id-type="doi">10.1200/CCI.23.00070</pub-id><pub-id pub-id-type="medline">37976441</pub-id></nlm-citation></ref><ref id="ref70"><label>70</label><nlm-citation citation-type="web"><article-title>BALANCE-ML</article-title><source>GitHub</source><access-date>2026-04-14</access-date><comment><ext-link ext-link-type="uri" 
xlink:href="https://github.com/NJHubel/BALANCE-ML/blob/main/README.md">https://github.com/NJHubel/BALANCE-ML/blob/main/README.md</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Additional tables, figures, and further details on the data used in this study.</p><media xlink:href="jmir_v28i1e81424_app1.pdf" xlink:title="PDF File, 7678 KB"/></supplementary-material></app-group></back></article>