<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v27i1e77721</article-id>
      <article-id pub-id-type="pmid">41191908</article-id>
      <article-id pub-id-type="doi">10.2196/77721</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Viewpoint</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Viewpoint</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Beyond Comparing Machine Learning and Logistic Regression in Clinical Prediction Modelling: Shifting from Model Debate to Data Quality</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Silvey</surname>
            <given-names>Scott</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Li</surname>
            <given-names>Jieni</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Hu</surname>
            <given-names>Yanan</given-names>
          </name>
          <degrees>BCom</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Monash Centre for Health Research and Implementation</institution>
            <institution>Faculty of Medicine, Nursing and Health Sciences</institution>
            <institution>Monash University</institution>
            <addr-line>43-51 Kanooka Grove</addr-line>
            <addr-line>Melbourne, 3168</addr-line>
            <country>Australia</country>
            <phone>61 438555775</phone>
            <email>yanan.hu@monash.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1794-7789</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Xin</given-names>
          </name>
          <degrees>BEng, MEng, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0675-6891</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Slavin</surname>
            <given-names>Valerie</given-names>
          </name>
          <degrees>BSc, PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7688-2498</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Belsti</surname>
            <given-names>Yitayeh</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8984-1495</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Tiruneh</surname>
            <given-names>Sofonyas Abebaw</given-names>
          </name>
          <degrees>MPH</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5867-5105</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Callander</surname>
            <given-names>Emily</given-names>
          </name>
          <degrees>BA, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7233-6804</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Enticott</surname>
            <given-names>Joanne</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4480-5690</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Monash Centre for Health Research and Implementation</institution>
        <institution>Faculty of Medicine, Nursing and Health Sciences</institution>
        <institution>Monash University</institution>
        <addr-line>Melbourne</addr-line>
        <country>Australia</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Electrical and Computer Systems Engineering</institution>
        <institution>Monash University</institution>
        <addr-line>Melbourne</addr-line>
        <country>Australia</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Gold Coast Hospital and Health Service</institution>
        <institution>Gold Coast Hospital</institution>
        <addr-line>Gold Coast</addr-line>
        <country>Australia</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>School of Nursing and Midwifery</institution>
        <institution>Griffith University</institution>
        <addr-line>Gold Coast</addr-line>
        <country>Australia</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>School of Nursing and Midwifery</institution>
        <institution>University of Technology Sydney</institution>
        <addr-line>Sydney</addr-line>
        <country>Australia</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>School of Nursing, Midwifery and Social Work</institution>
        <institution>The University of Queensland</institution>
        <addr-line>Brisbane</addr-line>
        <country>Australia</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>School of Public Health</institution>
        <institution>University of Technology Sydney</institution>
        <addr-line>Sydney</addr-line>
        <country>Australia</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Yanan Hu <email>yanan.hu@monash.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>5</day>
        <month>11</month>
        <year>2025</year>
      </pub-date>
      <volume>27</volume>
      <elocation-id>e77721</elocation-id>
      <history>
        <date date-type="received">
          <day>19</day>
          <month>5</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>24</day>
          <month>7</month>
          <year>2025</year>
        </date>
        <date date-type="rev-recd">
          <day>28</day>
          <month>7</month>
          <year>2025</year>
        </date>
        <date date-type="accepted">
          <day>14</day>
          <month>8</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©Yanan Hu, Xin Zhang, Valerie Slavin, Yitayeh Belsti, Sofonyas Abebaw Tiruneh, Emily Callander, Joanne Enticott. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 05.11.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2025/1/e77721" xlink:type="simple"/>
      <abstract>
        <p>The rapid uptake of supervised machine learning (ML) in clinical prediction modelling, particularly for binary outcomes based on tabular data, has sparked debate about its comparative advantage over traditional statistical logistic regression. Although ML has demonstrated superiority in unstructured data domains, its performance gains in structured, tabular clinical datasets remain inconsistent and context dependent. This viewpoint synthesizes recent comparative studies and simulation findings to argue that there is no universal best modelling approach. Model performance depends heavily on dataset characteristics (eg, linearity, sample size, number of candidate predictors, minority class proportion) and data quality (eg, completeness, accuracy). Consequently, we argue that efforts to improve data quality, not model complexity, are more likely to enhance the reliability and real-world utility of clinical prediction models.</p>
      </abstract>
      <kwd-group>
        <kwd>machine learning</kwd>
        <kwd>clinical prediction models</kwd>
        <kwd>logistic regression</kwd>
        <kwd>clinical data</kwd>
        <kwd>data quality</kwd>
        <kwd>binary classfication</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The increasing adoption of supervised machine learning (ML) in clinical prediction models (diagnostic or prognostic) based on tabular data has sparked considerable debate regarding its comparative performance against traditional statistical logistic regression (LR), particularly for binary outcomes such as mortality or the occurrence of adverse events [<xref ref-type="bibr" rid="ref1">1</xref>]. Although supervised ML approaches have demonstrated clear superiority in classifying unstructured clinical data such as medical images and texts [<xref ref-type="bibr" rid="ref2">2</xref>], their added value for the classification of clinical tabular data, where structured data are organized in tables, typically with rows representing individual cases and columns representing individual characteristics, remains uncertain and context-dependent [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
    </sec>
    <sec sec-type="Definition of Statistical LR Versus ML-Based LR">
      <title>Definition of Statistical LR Versus ML-Based LR</title>
      <p>The distinction between statistical LR and ML-based LR is frequently blurred in both literature and practice [<xref ref-type="bibr" rid="ref1">1</xref>]. Many studies loosely refer to any penalized LR model as ML, despite fundamental methodological differences. To enable valid comparisons between these approaches, it is therefore crucial to clearly delineate their boundaries (<xref ref-type="table" rid="table1">Table 1</xref>).</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Definitions of statistical logistic regression and machine learning–based logistic regression.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="150"/>
          <col width="850"/>
          <thead>
            <tr valign="top">
              <td>Method</td>
              <td>Definition</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Statistical logistic  <break/>  
            regression</td>
              <td>A parametric model operating under conventional statistical assumptions, including linearity and independence, employing fixed hyperparameters without data-driven optimization, using prespecified candidate predictors based on clinical or theoretical justification. This aligns with traditional epidemiological approaches where model specification precedes data analysis.</td>
            </tr>
            <tr valign="top">
              <td>Machine learning–based logistic regression</td>
              <td>An adaptive variant where model specification becomes part of the analytical process itself, hyperparameters like penalty terms are tuned through cross-validation, predictors may be selected algorithmically from a broader set of candidates, and the analytical focus shifts decisively toward predictive performance. While mathematically similar to statistical logistic regression, this approach embodies the machine learning philosophy of learning from data.</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <p>In this paper, we adopt the definition proposed in a previous systematic review [<xref ref-type="bibr" rid="ref1">1</xref>], which characterizes statistical LR as a theory-based model that operates under strict assumptions and does not involve data-driven optimization of predictive performance through hyperparameter tuning but relies on subject knowledge from researchers or experts to specify the model structure. Although penalized LR models may involve hyperparameter tuning and variable selection, they remain theory-involved and do not intrinsically capture nonlinearities or interactions, and the core assumptions of LR still apply. Conversely, ML models are defined as methods that autonomously learn patterns from data (ie, data-driven hyperparameter tuning or predictor selection) [<xref ref-type="bibr" rid="ref4">4</xref>], including ML-based LR and other supervised ML methods (eg, random forest, boosting, neural networks, support vector machine) that intrinsically handle complex interactions without manual specification beforehand.</p>
    </sec>
    <sec sec-type="Comparative Performance: What Was Already Known">
      <title>Comparative Performance: What Was Already Known</title>
      <p>A 2019 meta-regression of 145 low-risk-of-bias comparisons between statistical LR and ML binary clinical prediction models on tabular data showed no performance benefit of ML over statistical LR [<xref ref-type="bibr" rid="ref1">1</xref>]. However, this comparison was limited to discrimination measured by the area under the receiver operating characteristic curve (AUROC), as other performance metrics were not frequently reported. Notably, 79% (56/71) of the studies did not report calibration performance, and only one study reported clinical utility. Clinical utility is commonly assessed through decision curve analysis, which estimates the clinical value of a prediction model at the population level by considering the consequences of decisions made based on its output [<xref ref-type="bibr" rid="ref5">5</xref>], specifically, the benefit of correctly predicting true positives and the harm of incorrectly predicting false positives. A step-by-step guide to this method is available here [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
      <p>Each performance metric captures a distinct aspect of model performance, with its own strengths and limitations. A model may achieve a high AUROC yet still have poor calibration and potentially harmful clinical consequences if the predicted probabilities are systematically overestimated or underestimated; vice versa, a well-calibrated model may still have poor discriminative ability. This highlights the need for comprehensive evaluation across multiple performance domains, including discrimination, calibration, classification metrics, clinical utility, and fairness. Therefore, focusing solely on marginal gains in AUROC between LR and ML can be misleading and inadequate for guiding future research.</p>
      <p>Furthermore, the meta-regression of AUROC did not explore the underlying sources of performance differences (eg, sample size, number of predictors, use of hyperparameter tuning). Therefore, it is still unclear whether the observed variation in performance reflects true algorithmic superiority or is instead driven by dataset characteristics or modelling procedures. For example, the systematic review highlighted that more than half of the included studies did not clearly report their hyperparameter tuning strategies.</p>
      <p>The comparison should not only focus on the difference in performance but also on the stability of performance [<xref ref-type="bibr" rid="ref7">7</xref>]. Even when statistical LR outperforms ML in certain metrics (eg, AUROC), this does not necessarily imply that the predictions are stable or reproducible, that is, applying the same model development procedure to different samples of the same size drawn from the same underlying population can result in substantially different predictions for the same individual. This issue is particularly pronounced when using small development datasets, which leads to more different models in the multiverse, often with vastly unstable individual predictions [<xref ref-type="bibr" rid="ref8">8</xref>]. Adherence to the minimum sample size recommendations is one way to mitigate this issue [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Notably, a 2023 systematic review reported that 73% of the binary clinical prediction models using statistical LR had sample sizes below the recommended minimum threshold [<xref ref-type="bibr" rid="ref11">11</xref>]. ML algorithms are generally more data-hungry than LR to achieve stable performance. For example, one study demonstrated that random forest may require more than 20 times the number of events for each candidate predictor compared to statistical LR [<xref ref-type="bibr" rid="ref10">10</xref>].</p>
    </sec>
    <sec sec-type="Research Recommendation for Reporting: Improving the Transparency of Each Step">
      <title>Research Recommendation for Reporting: Improving the Transparency of Each Step</title>
      <p>In light of the methodological issues identified in the current literature rather than focusing solely on determining the inherent superiority of one modelling approach over another, greater attention should be directed toward ensuring the rigor and transparency of modelling procedures. This includes clear documentation of data preprocessing steps, sample size justifications, modelling decisions, hyperparameter tuning strategies (eg, grid or random search), feature selection techniques (including filter methods like correlation analysis, wrapper methods like recursive feature elimination, or embedded methods such as least absolute shrinkage and selection operator [LASSO]), model performance evaluation methods and metrics, and model explanation methods (eg, Shapley Additive Explanations [SHAP] [<xref ref-type="bibr" rid="ref12">12</xref>], Submodular Pick Local Interpretable Model-agnostic Explanations [SP-LIME] [<xref ref-type="bibr" rid="ref13">13</xref>], and Counterfactual Explanations for Robustness, Transparency, Interpretability, and Fairness of Artificial Intelligence [CERTIFAI] models [<xref ref-type="bibr" rid="ref14">14</xref>]).</p>
    </sec>
    <sec sec-type="No Free Lunch Theorem">
      <title>No Free Lunch Theorem</title>
      <p>There is no universal golden method for clinical prediction models [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>] and whether the benefit of each algorithm (either statistical or ML) can be fulfilled is highly subject to the dataset characteristics (eg, sample size, class imbalance, nonlinearity, number of candidate predictors [<xref ref-type="bibr" rid="ref10">10</xref>]) and data quality (eg, completeness, accuracy [<xref ref-type="bibr" rid="ref17">17</xref>]).</p>
      <p>Each algorithm has its unique strengths and limitations in handling different data characteristics (<xref ref-type="table" rid="table2">Table 2</xref>). For example, Categorical Boosting is particularly effective for datasets with high-cardinality categorical variables, as it includes built-in techniques to encode categories without extensive preprocessing [<xref ref-type="bibr" rid="ref18">18</xref>]. eXtreme Gradient Boosting [<xref ref-type="bibr" rid="ref19">19</xref>] and Light Gradient-Boosting Machine [<xref ref-type="bibr" rid="ref20">20</xref>] are known for their computational efficiency, performance in data with complex feature interactions, and native handling of missing data, but are less interpretable than LR. Deep learning, a subfield of ML, uses multilayered neural networks to simulate human decision-making [<xref ref-type="bibr" rid="ref21">21</xref>]. While capable of learning highly complex nonlinear relationships from extremely large and high-dimensional datasets, deep learning models are generally more data-hungry, less interpretable, and require significantly more computational resources than traditional ML methods, which may limit their transparency and clinical applicability [<xref ref-type="bibr" rid="ref22">22</xref>]. Although efforts in Explainable Artificial Intelligence (XAI) are advancing, current ML models often fall short of the level of clarity and trust required for clinical implementation [<xref ref-type="bibr" rid="ref23">23</xref>]. On the other hand, LR is highly interpretable and performs well on small sample sizes when predictors have an approximately linear relationship with the outcome, but it may struggle with complex nonlinearities or large numbers of correlated predictors. The smaller the sample size available, the more we must rely on external information or inputs from experts to determine the features/predictors.</p>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>Strengths and weaknesses of statistical logistic regression and machine learning in binary clinical prediction models based on tabular data.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="250"/>
          <col width="400"/>
          <col width="350"/>
          <thead>
            <tr valign="top">
              <td>Aspect</td>
              <td>Statistical logistic regression</td>
              <td>Supervised machine learning</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Learning process</td>
              <td>Theory-driven; relies on expert knowledge for model specification and candidate predictor selection</td>
              <td>Data-driven; directly and automatically learn relationship from data</td>
            </tr>
            <tr valign="top">
              <td>Assumptions in data structure</td>
              <td>High (eg, interactions, linearity)</td>
              <td>Low; handle complex, nonlinear relationship</td>
            </tr>
            <tr valign="top">
              <td>Assumptions in model specification</td>
              <td>High; use default value</td>
              <td>Low; data-driven hyperparameter tuning</td>
            </tr>
            <tr valign="top">
              <td>User input in creation and selection of candidate predictors</td>
              <td>High; researchers need to investigate the nonlinearity of continuous variables and interaction effects and systematic review or expert opinion of candidate predictors before developing the model</td>
              <td>Low; models automatically capture nonlinearity and interactions, no need for researchers to investigate nonlinearity and interaction effects between variables</td>
            </tr>
            <tr valign="top">
              <td>Flexibility</td>
              <td>Low; constrained by linearity assumptions but can be improved by adding penalty</td>
              <td>High</td>
            </tr>
            <tr valign="top">
              <td>Complexity</td>
              <td>Low; simple, parametric model</td>
              <td>High</td>
            </tr>
            <tr valign="top">
              <td>Performance on complex data</td>
              <td>Low</td>
              <td>High</td>
            </tr>
            <tr valign="top">
              <td>Sample size requirement for stable performance</td>
              <td>Low</td>
              <td>High; data-hungriness</td>
            </tr>
            <tr valign="top">
              <td>Interpretability (in-processing decision-making process)</td>
              <td>High; white-box nature, model coefficients are directly interpretable, can also be presented using graphical score charts or nomograms</td>
              <td>Low; black-box nature, decision-making process is not transparent</td>
            </tr>
            <tr valign="top">
              <td>Explainability (postprocessing explanation)</td>
              <td>High</td>
              <td>Low; complex to explain to end users, requires post hoc methods like Shapley Additive Explanations for explanation</td>
            </tr>
            <tr valign="top">
              <td>Deployment ease</td>
              <td>High</td>
              <td>Low</td>
            </tr>
            <tr valign="top">
              <td>Computational cost</td>
              <td>Low</td>
              <td>High</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <p>Therefore, the choice of the algorithm should be tailored to the structure, quality, and characteristics of the dataset. Ultimately, the development of clinical prediction models involves unavoidable trade-offs. There is no single algorithm that excels across all performance metrics (fairness, accuracy, generalizability, stability, parsimony, and interpretability). Researchers must prioritize certain metrics depending on the model’s intended application and target population. For instance, model parsimony, where a model with fewer predictors may sacrifice some accuracy for simplicity, can be crucial in enhancing user acceptance, as overly complex models may reduce usability. Additionally, discussions with stakeholders (eg, health care providers, patients) regarding the most relevant features or desired trade-offs can guide model development.</p>
      <p>Clinical tabular datasets often exhibit characteristics that tend to favor LR over ML models [<xref ref-type="bibr" rid="ref9">9</xref>]. These include small to moderate sample sizes, relatively high levels of noise, a limited number of candidate predictors (ie, low dimension), and typically binary outcomes (<xref ref-type="table" rid="table3">Table 3</xref>). Such conditions can constrain the ability of complex ML algorithms to demonstrate superior performance. Moreover, LR’s well-recognized interpretability and trustworthiness [<xref ref-type="bibr" rid="ref24">24</xref>] further reinforce its widespread use in clinical prediction modelling, and it is typically used as a reference model for performance benchmarking in ML studies. However, ML approaches may warrant consideration when they demonstrate clear superiority in performance, supported by model explainability to help build trust among clinicians and end users. To date, no consensus exists on how to evaluate or compare model interpretability and explainability across different methods [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
      <table-wrap position="float" id="table3">
        <label>Table 3</label>
        <caption>
          <p>Mismatches between the characteristics of clinical data and supervised machine learning’s strengths.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="120"/>
          <col width="300"/>
          <col width="280"/>
          <col width="300"/>
          <thead>
            <tr valign="top">
              <td>Aspect</td>
              <td>Characteristics in clinical data</td>
              <td>Supervised machine learning’s relative strength compared to statistical logistic regression</td>
              <td>Comments</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Data modality</td>
              <td>Mostly single modal data (tabular data)</td>
              <td>Excels with multimodal data (image, scan, text, or signal)</td>
              <td>Clinical datasets often lack the multimodal richness that enables ML<sup>a</sup> models to fully demonstrate their advantages</td>
            </tr>
            <tr valign="top">
              <td>Data quality</td>
              <td>High noise due to errors, missingness, or inconsistent measurement (low signal-to-noise ratio)</td>
              <td>Performs better for data with high signal-to-noise ratio</td>
              <td>Noise dilutes true signals, and ML models tend to overfit to noisy artifacts without careful data preprocessing</td>
            </tr>
            <tr valign="top">
              <td>Sample size</td>
              <td>Often small to moderate</td>
              <td>Benefit from large-scale datasets. More “data-hungry”</td>
              <td>Although sample sizes are improving in some registries, they are often insufficient to train complex ML architectures robustly</td>
            </tr>
            <tr valign="top">
              <td>Predictors</td>
              <td>Typically, a small set of clinically meaningful predictors with high linearity and low order of interaction terms</td>
              <td>Excels with high-dimensional, nonlinear interactions, temporally rich data</td>
              <td>ML's strength in handling high-dimensional, time-series data with higher nonlinearity and interaction terms</td>
            </tr>
            <tr valign="top">
              <td>Prediction</td>
              <td>Predominantly binary classification (eg, event occurrence: yes/no).</td>
              <td>Advantage in multiclass classification and regression</td>
              <td>Simple binary classification problems often diminish the additional complexity that ML can handle</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table3fn1">
            <p><sup>a</sup>ML: machine learning.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
    </sec>
    <sec sec-type="Policy and Research Recommendation: Shifting From Model Debate to Data Quality">
      <title>Policy and Research Recommendation: Shifting From Model Debate to Data Quality</title>
      <p>Amid increasing interest in complex models, it is crucial to reorient clinical prediction modelling from a model-centric to a data-centric paradigm [<xref ref-type="bibr" rid="ref25">25</xref>]. The quality, structure, and representativeness of data are far more critical to model performance than the complexity of models. In clinical settings, prediction models serve best as a second set of eyes, complementing clinical judgment rather than replacing it [<xref ref-type="bibr" rid="ref23">23</xref>]. However, without high-quality data, even the most sophisticated models will propagate existing biases and limitations, as the saying goes, “garbage in, garbage out.”</p>
      <p>As the number of clinical prediction models continues to grow, policymakers and funding bodies should prioritize investment in data quality infrastructure, including standardized phenotyping, consistent variable definitions, and robust data curation practices. Since all models are trained on historical data that inherently reflect systemic limitations, model complexity cannot resolve errors rooted in the data; in fact, they might amplify the bias and make unfair decisions in underrepresented or marginal groups such as defined by sex, ethnicity, or deprivation [<xref ref-type="bibr" rid="ref26">26</xref>]. In contrast, thoughtful data preprocessing and transparent reporting of modelling strategies are foundational to developing reliable, generalizable, reproducible, and trustworthy decision support tools [<xref ref-type="bibr" rid="ref27">27</xref>]. In addition, more effort is needed to expand the candidate predictors available in health data [<xref ref-type="bibr" rid="ref26">26</xref>], such as integrating lifestyle factors collected through wearables and a range of medical devices [<xref ref-type="bibr" rid="ref28">28</xref>].</p>
      <p>This shift in emphasis from modelling sophistication to data stewardship is essential to ensure that clinical prediction tools genuinely enhance, rather than undermine, the quality and equity of patient-centered care.</p>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUROC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CERTIFAI</term>
          <def>
            <p>Counterfactual Explanations for Robustness, Transparency, Interpretability, and Fairness of Artificial Intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">LASSO</term>
          <def>
            <p>least absolute shrinkage and selection operator</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">LR</term>
          <def>
            <p>logistic regression</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">SHAP</term>
          <def>
            <p>Shapley Additive Explanations</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">SP-LIME</term>
          <def>
            <p>Submodular Pick Local Interpretable Model-agnostic Explanations</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">XAI</term>
          <def>
            <p>Explainable Artificial Intelligence</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Christodoulou</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Steyerberg</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Verbakel</surname>
              <given-names>JY</given-names>
            </name>
            <name name-style="western">
              <surname>Van Calster</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>A systematic review shows no performance benefit of machine learning over logistic regression for clinical prediction models</article-title>
          <source>J Clin Epidemiol</source>
          <year>2019</year>
          <month>06</month>
          <volume>110</volume>
          <fpage>12</fpage>
          <lpage>22</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2019.02.004</pub-id>
          <pub-id pub-id-type="medline">30763612</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(18)31081-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chakraborty</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bhattacharya</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>From machine learning to deep learning: advances of the recent data-driven paradigm shift in medicine and healthcare</article-title>
          <source>Current Research in Biotechnology</source>
          <year>2024</year>
          <volume>7</volume>
          <fpage>100164</fpage>
          <pub-id pub-id-type="doi">10.1016/j.crbiot.2023.100164</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mann</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lyons</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>O'Rourke</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Davies</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Machine learning or traditional statistical methods for predictive modelling in perioperative medicine: a narrative review</article-title>
          <source>J Clin Anesth</source>
          <year>2025</year>
          <month>03</month>
          <volume>102</volume>
          <fpage>111782</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinane.2025.111782</pub-id>
          <pub-id pub-id-type="medline">39977974</pub-id>
          <pub-id pub-id-type="pii">S0952-8180(25)00042-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Breiman</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Statistical modeling: the two cultures (with comments and a rejoinder by the author)</article-title>
          <source>Statist Sci</source>
          <year>2001</year>
          <month>8</month>
          <day>1</day>
          <volume>16</volume>
          <issue>3</issue>
          <fpage>199</fpage>
          <lpage>231</lpage>
          <pub-id pub-id-type="doi">10.1214/ss/1009213726</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vickers</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Elkin</surname>
              <given-names>EB</given-names>
            </name>
          </person-group>
          <article-title>Decision curve analysis: a novel method for evaluating prediction models</article-title>
          <source>Med Decis Making</source>
          <year>2006</year>
          <month>11</month>
          <day>01</day>
          <volume>26</volume>
          <issue>6</issue>
          <fpage>565</fpage>
          <lpage>574</lpage>
          <pub-id pub-id-type="doi">10.1177/0272989x06295361</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vickers</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>van Calster</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Steyerberg</surname>
              <given-names>EW</given-names>
            </name>
          </person-group>
          <article-title>A simple, step-by-step guide to interpreting decision curve analysis</article-title>
          <source>Diagn Progn Res</source>
          <year>2019</year>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>18</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31592444"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s41512-019-0064-7</pub-id>
          <pub-id pub-id-type="medline">31592444</pub-id>
          <pub-id pub-id-type="pii">64</pub-id>
          <pub-id pub-id-type="pmcid">PMC6777022</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Riley</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>GS</given-names>
            </name>
          </person-group>
          <article-title>Stability of clinical prediction models developed using statistical or machine learning methods</article-title>
          <source>Biom J</source>
          <year>2023</year>
          <month>12</month>
          <volume>65</volume>
          <issue>8</issue>
          <fpage>e2200302</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37466257"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/bimj.202200302</pub-id>
          <pub-id pub-id-type="medline">37466257</pub-id>
          <pub-id pub-id-type="pmcid">PMC10952221</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Riley</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Pate</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dhiman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Archer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>GP</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>GS</given-names>
            </name>
          </person-group>
          <article-title>Clinical prediction models and the multiverse of madness</article-title>
          <source>BMC Med</source>
          <year>2023</year>
          <month>12</month>
          <day>18</day>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>502</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedicine.biomedcentral.com/articles/10.1186/s12916-023-03212-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12916-023-03212-y</pub-id>
          <pub-id pub-id-type="medline">38110939</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12916-023-03212-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC10729337</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Riley</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Ensor</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Snell</surname>
              <given-names>KIE</given-names>
            </name>
            <name name-style="western">
              <surname>Harrell</surname>
              <given-names>FE</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>GP</given-names>
            </name>
            <name name-style="western">
              <surname>Reitsma</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Moons</surname>
              <given-names>KGM</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>van Smeden</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Calculating the sample size required for developing a clinical prediction model</article-title>
          <source>BMJ</source>
          <year>2020</year>
          <month>03</month>
          <day>18</day>
          <volume>368</volume>
          <fpage>m441</fpage>
          <pub-id pub-id-type="doi">10.1136/bmj.m441</pub-id>
          <pub-id pub-id-type="medline">32188600</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Silvey</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Sample size requirements for popular classification algorithms in tabular clinical data: empirical study</article-title>
          <source>J Med Internet Res</source>
          <year>2024</year>
          <month>12</month>
          <day>17</day>
          <volume>26</volume>
          <fpage>e60231</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2024//e60231/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/60231</pub-id>
          <pub-id pub-id-type="medline">39689306</pub-id>
          <pub-id pub-id-type="pii">v26i1e60231</pub-id>
          <pub-id pub-id-type="pmcid">PMC11688588</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>Dhiman</collab>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Jie</given-names>
            </name>
            <name name-style="western">
              <surname>Qi</surname>
              <given-names>Cathy</given-names>
            </name>
            <name name-style="western">
              <surname>Bullock</surname>
              <given-names>Garrett</given-names>
            </name>
            <name name-style="western">
              <surname>Sergeant</surname>
              <given-names>Jamie C</given-names>
            </name>
            <name name-style="western">
              <surname>Riley</surname>
              <given-names>Richard D</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>Gary S</given-names>
            </name>
          </person-group>
          <article-title>Sample size requirements are not being considered in studies developing prediction models for binary outcomes: a systematic review</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2023</year>
          <month>08</month>
          <day>19</day>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>188</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/s12874-023-02008-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12874-023-02008-1</pub-id>
          <pub-id pub-id-type="medline">37598153</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12874-023-02008-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC10439652</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lundberg</surname>
              <given-names>Scott M</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Su-In</given-names>
            </name>
          </person-group>
          <article-title>A unified approach to interpreting model predictions</article-title>
          <source>ArXiv. Preprint posted online on November 25, 2017</source>
          <year>2017</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1705.07874"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1705.07874</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ribeiro</surname>
              <given-names>Marco Tulio</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>Sameer</given-names>
            </name>
            <name name-style="western">
              <surname>Guestrin</surname>
              <given-names>Carlos</given-names>
            </name>
          </person-group>
          <article-title>"Why should I trust you?": explaining the predictions of any classifier</article-title>
          <year>2016</year>
          <month>08</month>
          <day>13</day>
          <conf-name>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
          <conf-date>2016</conf-date>
          <conf-loc>San Francisco, California, USA</conf-loc>
          <fpage>1135</fpage>
          <lpage>1144</lpage>
          <pub-id pub-id-type="doi">https://doi.org/10.1145/2939672.2939778</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>Shubham</given-names>
            </name>
            <name name-style="western">
              <surname>Henderson</surname>
              <given-names>Jette</given-names>
            </name>
            <name name-style="western">
              <surname>Ghosh</surname>
              <given-names>Joydeep</given-names>
            </name>
          </person-group>
          <article-title>CERTIFAI: a common framework to provide explanations and analyse the fairness and robustness of black-box models</article-title>
          <year>2020</year>
          <month>02</month>
          <day>07</day>
          <conf-name>Proceedings of the AAAI/ACM Conference on AI, Ethics, and Society</conf-name>
          <conf-date>February 7</conf-date>
          <conf-loc>New York, NY, USA</conf-loc>
          <fpage>166</fpage>
          <lpage>172</lpage>
          <pub-id pub-id-type="doi">10.1145/3375627.3375812</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wolpert</surname>
              <given-names>DH</given-names>
            </name>
          </person-group>
          <article-title>The supervised learning no-free-lunch theorems</article-title>
          <source>Soft Computing and Industry</source>
          <year>2002</year>
          <publisher-loc>London</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>25</fpage>
          <lpage>42</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fernández-Delgado</surname>
              <given-names>Manuel</given-names>
            </name>
            <name name-style="western">
              <surname>Cernadas</surname>
              <given-names>Eva</given-names>
            </name>
            <name name-style="western">
              <surname>Barro</surname>
              <given-names>Senén</given-names>
            </name>
            <name name-style="western">
              <surname>Amorim</surname>
              <given-names>Dinani</given-names>
            </name>
          </person-group>
          <article-title>Do we need hundreds of classifiers to solve real world classification problems?</article-title>
          <source>JMLR</source>
          <year>2014</year>
          <access-date>2025-11-03</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jmlr.org/papers/volume15/delgado14a/delgado14a.pdf">https://jmlr.org/papers/volume15/delgado14a/delgado14a.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mohammed</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Budach</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Feuerpfeil</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ihde</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Nathansen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Noack</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Patzlaff</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Naumann</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Harmouch</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>The effects of data quality on machine learning performance on tabular data</article-title>
          <source>Information Systems</source>
          <year>2025</year>
          <month>07</month>
          <volume>132</volume>
          <fpage>102549</fpage>
          <pub-id pub-id-type="doi">10.1016/j.is.2025.102549</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prokhorenkova</surname>
              <given-names>Liudmila</given-names>
            </name>
            <name name-style="western">
              <surname>Gusev</surname>
              <given-names>Gleb</given-names>
            </name>
            <name name-style="western">
              <surname>Vorobev</surname>
              <given-names>Aleksandr</given-names>
            </name>
            <name name-style="western">
              <surname>Dorogush</surname>
              <given-names>Anna Veronika</given-names>
            </name>
            <name name-style="western">
              <surname>Gulin</surname>
              <given-names>Andrey</given-names>
            </name>
          </person-group>
          <article-title>CatBoost: unbiased boosting with categorical features</article-title>
          <year>2018</year>
          <month>12</month>
          <day>03</day>
          <conf-name>Proceedings of the 32nd International Conference on Neural Information Processing Systems</conf-name>
          <conf-date>December 3</conf-date>
          <conf-loc>Montréal, Canada</conf-loc>
          <fpage>6639</fpage>
          <lpage>6649</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/abs/10.5555/3327757.3327770"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Tianqi</given-names>
            </name>
            <name name-style="western">
              <surname>Guestrin</surname>
              <given-names>Carlos</given-names>
            </name>
          </person-group>
          <article-title>XGBoost: a scalable tree boosting system</article-title>
          <year>2016</year>
          <month>08</month>
          <day>13</day>
          <conf-name>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
          <conf-date>August 13</conf-date>
          <conf-loc>San Francisco, California, USA</conf-loc>
          <fpage>785</fpage>
          <lpage>794</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/2939672.2939785"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ke</surname>
              <given-names>Guolin</given-names>
            </name>
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>Qi</given-names>
            </name>
            <name name-style="western">
              <surname>Finley</surname>
              <given-names>Thomas</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Taifeng</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Wei</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Weidong</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>Qiwei</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Tie-Yan</given-names>
            </name>
          </person-group>
          <article-title>LightGBM: a highly efficient gradient boosting decision tree</article-title>
          <year>2017</year>
          <month>12</month>
          <day>04</day>
          <conf-name>Proceedings of the 31st International Conference on Neural Information Processing Systems</conf-name>
          <conf-date>December 13</conf-date>
          <conf-loc>Long Beach, California, USA</conf-loc>
          <fpage>3149</fpage>
          <lpage>3157</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.5555/3294996.3295074"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Coyner</surname>
              <given-names>Aaron S</given-names>
            </name>
            <name name-style="western">
              <surname>Kalpathy-Cramer</surname>
              <given-names>Jayashree</given-names>
            </name>
            <name name-style="western">
              <surname>Chiang</surname>
              <given-names>Michael F</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>J Peter</given-names>
            </name>
          </person-group>
          <article-title>Introduction to machine learning, neural networks, and deep learning</article-title>
          <source>Transl Vis Sci Technol</source>
          <year>2020</year>
          <month>03</month>
          <day>27</day>
          <volume>9</volume>
          <issue>2</issue>
          <fpage>14</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32704420"/>
          </comment>
          <pub-id pub-id-type="doi">10.1167/tvst.9.2.14</pub-id>
          <pub-id pub-id-type="medline">32704420</pub-id>
          <pub-id pub-id-type="pii">TVST-19-2007</pub-id>
          <pub-id pub-id-type="pmcid">PMC7347027</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shwartz-Ziv</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Armon</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Tabular data: deep learning is not all you need</article-title>
          <source>Information Fusion</source>
          <year>2022</year>
          <month>05</month>
          <volume>81</volume>
          <fpage>84</fpage>
          <lpage>90</lpage>
          <pub-id pub-id-type="doi">10.1016/j.inffus.2021.11.011</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Antoniadi</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Guendouz</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mazo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Becker</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Mooney</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Current challenges and future opportunities for XAI in machine learning-based clinical decision support systems: a systematic review</article-title>
          <source>Applied Sciences</source>
          <year>2021</year>
          <month>05</month>
          <day>31</day>
          <volume>11</volume>
          <issue>11</issue>
          <fpage>5088</fpage>
          <pub-id pub-id-type="doi">10.3390/app11115088</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rudin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Stop explaining black box machine learning models for high stakes decisions and use interpretable models instead</article-title>
          <source>Nat Mach Intell</source>
          <year>2019</year>
          <month>05</month>
          <volume>1</volume>
          <issue>5</issue>
          <fpage>206</fpage>
          <lpage>215</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35603010"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s42256-019-0048-x</pub-id>
          <pub-id pub-id-type="medline">35603010</pub-id>
          <pub-id pub-id-type="pmcid">PMC9122117</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zha</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bhat</surname>
              <given-names>ZP</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Data-centric artificial intelligence: a survey</article-title>
          <source>ACM Comput Surv</source>
          <year>2025</year>
          <month>01</month>
          <day>24</day>
          <volume>57</volume>
          <issue>5</issue>
          <fpage>1</fpage>
          <lpage>42</lpage>
          <pub-id pub-id-type="doi">10.1145/3711118</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Weeraratne</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Frisse</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Misulis</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Rhee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Snowdon</surname>
              <given-names>JL</given-names>
            </name>
          </person-group>
          <article-title>Precision medicine, AI, and the future of personalized health care</article-title>
          <source>Clin Transl Sci</source>
          <year>2021</year>
          <month>01</month>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>86</fpage>
          <lpage>93</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32961010"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/cts.12884</pub-id>
          <pub-id pub-id-type="medline">32961010</pub-id>
          <pub-id pub-id-type="pmcid">PMC7877825</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>Gary S</given-names>
            </name>
            <name name-style="western">
              <surname>Moons</surname>
              <given-names>Karel G M</given-names>
            </name>
            <name name-style="western">
              <surname>Dhiman</surname>
              <given-names>Paula</given-names>
            </name>
            <name name-style="western">
              <surname>Riley</surname>
              <given-names>Richard D</given-names>
            </name>
            <name name-style="western">
              <surname>Beam</surname>
              <given-names>Andrew L</given-names>
            </name>
            <name name-style="western">
              <surname>Van Calster</surname>
              <given-names>Ben</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>Marzyeh</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Xiaoxuan</given-names>
            </name>
            <name name-style="western">
              <surname>Reitsma</surname>
              <given-names>Johannes B</given-names>
            </name>
            <name name-style="western">
              <surname>van Smeden</surname>
              <given-names>Maarten</given-names>
            </name>
            <name name-style="western">
              <surname>Boulesteix</surname>
              <given-names>Anne-Laure</given-names>
            </name>
            <name name-style="western">
              <surname>Camaradou</surname>
              <given-names>Jennifer Catherine</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>Leo Anthony</given-names>
            </name>
            <name name-style="western">
              <surname>Denaxas</surname>
              <given-names>Spiros</given-names>
            </name>
            <name name-style="western">
              <surname>Denniston</surname>
              <given-names>Alastair K</given-names>
            </name>
            <name name-style="western">
              <surname>Glocker</surname>
              <given-names>Ben</given-names>
            </name>
            <name name-style="western">
              <surname>Golub</surname>
              <given-names>Robert M</given-names>
            </name>
            <name name-style="western">
              <surname>Harvey</surname>
              <given-names>Hugh</given-names>
            </name>
            <name name-style="western">
              <surname>Heinze</surname>
              <given-names>Georg</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffman</surname>
              <given-names>Michael M</given-names>
            </name>
            <name name-style="western">
              <surname>Kengne</surname>
              <given-names>André Pascal</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>Emily</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Naomi</given-names>
            </name>
            <name name-style="western">
              <surname>Loder</surname>
              <given-names>Elizabeth W</given-names>
            </name>
            <name name-style="western">
              <surname>Maier-Hein</surname>
              <given-names>Lena</given-names>
            </name>
            <name name-style="western">
              <surname>Mateen</surname>
              <given-names>Bilal A</given-names>
            </name>
            <name name-style="western">
              <surname>McCradden</surname>
              <given-names>Melissa D</given-names>
            </name>
            <name name-style="western">
              <surname>Oakden-Rayner</surname>
              <given-names>Lauren</given-names>
            </name>
            <name name-style="western">
              <surname>Ordish</surname>
              <given-names>Johan</given-names>
            </name>
            <name name-style="western">
              <surname>Parnell</surname>
              <given-names>Richard</given-names>
            </name>
            <name name-style="western">
              <surname>Rose</surname>
              <given-names>Sherri</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>Karandeep</given-names>
            </name>
            <name name-style="western">
              <surname>Wynants</surname>
              <given-names>Laure</given-names>
            </name>
            <name name-style="western">
              <surname>Logullo</surname>
              <given-names>Patricia</given-names>
            </name>
          </person-group>
          <article-title>TRIPOD+AI statement: updated guidance for reporting clinical prediction models that use regression or machine learning methods</article-title>
          <source>BMJ</source>
          <year>2024</year>
          <month>04</month>
          <day>16</day>
          <volume>385</volume>
          <fpage>e078378</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.bmj.com/lookup/pmidlookup?view=long&#38;pmid=38626948"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj-2023-078378</pub-id>
          <pub-id pub-id-type="medline">38626948</pub-id>
          <pub-id pub-id-type="pmcid">PMC11019967</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rudrapatna</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Butte</surname>
              <given-names>Atul J</given-names>
            </name>
          </person-group>
          <article-title>Opportunities and challenges in using real-world data for health care</article-title>
          <source>J Clin Invest</source>
          <year>2020</year>
          <month>03</month>
          <day>03</day>
          <volume>130</volume>
          <issue>2</issue>
          <fpage>565</fpage>
          <lpage>574</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1172/JCI129197"/>
          </comment>
          <pub-id pub-id-type="doi">10.1172/JCI129197</pub-id>
          <pub-id pub-id-type="medline">32011317</pub-id>
          <pub-id pub-id-type="pii">129197</pub-id>
          <pub-id pub-id-type="pmcid">PMC6994109</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
