<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v27i1e73190</article-id>
      <article-id pub-id-type="pmid">40344663</article-id>
      <article-id pub-id-type="doi">10.2196/73190</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Development of a 5-Year Risk Prediction Model for Transition From Prediabetes to Diabetes Using Machine Learning: Retrospective Cohort Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Sarvestan</surname>
            <given-names> Javad</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Gorrepati</surname>
            <given-names>Leela Prasad</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Dhillon</surname>
            <given-names>Reshvinder</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Agu</surname>
            <given-names>Chiamaka Pamela</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Yongsheng</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-0714-3374</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Hongyu</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0007-2700-1854</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Dawei</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0008-3283-9958</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Na</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0003-8466-3388</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Lv</surname>
            <given-names>Haoyue</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0007-6009-0166</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Guang</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Health Management</institution>
            <institution>The First Affiliated Hospital of Shandong First Medical University &#38; Shandong Provincial Qianfoshan Hospital</institution>
            <addr-line>16766 Jingshi Road</addr-line>
            <addr-line>Jinan, 250014</addr-line>
            <country>China</country>
            <phone>86 19353116378</phone>
            <email>zgpap2015@126.com</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6630-1912</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Health Management</institution>
        <institution>The First Affiliated Hospital of Shandong First Medical University &#38; Shandong Provincial Qianfoshan Hospital</institution>
        <addr-line>Jinan</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Shandong Engineering Research Center of Health Management, Shandong Institute of Health Management</institution>
        <institution>The First Affiliated Hospital of Shandong First Medical University &#38; Shandong Provincial Qianfoshan Hospital</institution>
        <addr-line>Jinan</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Occupational Health</institution>
        <institution>Shizhong District Center for Disease Control and Prevention</institution>
        <addr-line>Jinan</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Postgraduate Department</institution>
        <institution>Shandong First Medical University, Shandong Academy of Medical Sciences</institution>
        <addr-line>Jinan</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Guang Zhang <email>zgpap2015@126.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>9</day>
        <month>5</month>
        <year>2025</year>
      </pub-date>
      <volume>27</volume>
      <elocation-id>e73190</elocation-id>
      <history>
        <date date-type="received">
          <day>26</day>
          <month>2</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>17</day>
          <month>3</month>
          <year>2025</year>
        </date>
        <date date-type="rev-recd">
          <day>7</day>
          <month>4</month>
          <year>2025</year>
        </date>
        <date date-type="accepted">
          <day>17</day>
          <month>4</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©Yongsheng Zhang, Hongyu Zhang, Dawei Wang, Na Li, Haoyue Lv, Guang Zhang. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 09.05.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2025/1/e73190" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Diabetes has emerged as a critical global public health crisis. Prediabetes, as the transitional phase with 5%-10% annual progression to diabetes, offers a critical window for intervention. The lack of a 5-year risk prediction model for diabetes progression among Chinese individuals with prediabetes limits clinical decision-making support.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to develop and validate a machine learning–based 5-year risk prediction model of progression from prediabetes to diabetes for the Chinese population and establish an interactive web-based platform to facilitate high-risk patients identifying and early targeted interventions, ultimately reducing diabetes incidence and health care burdens.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>A retrospective cohort study was conducted on 2 prediabetes cohorts from 2 Chinese medical centers (primary cohort: n=6578 and external validation cohort: n=2333) tracking from 2019 to 2024. Participants meeting the American Diabetes Association (ADA) criteria (prediabetes: hemoglobin A1c [HbA1c] level of 5.7%-6.4%; diabetes: HbA1c level of ≥6.5%) were identified. A total of 42 variables (demographics, physical measures, and hematologic biomarkers) were collected using standardized protocols. Patients were split into the training (70%) and test (30%) sets randomly in the primary cohort. Significant predictors were selected on the training set using recursive feature elimination methods, followed by prediction model development using 7 machine learning algorithms (logistic regression, random forest, support vector machine, multilayer perceptron, extreme gradient boosting machine, light gradient boosting machine, and categorical boosting machine [CatBoost]), optimized through grid search and 5-fold cross-validation. Model performance was assessed using the receiver operating characteristic curve, the precision-recall curves, accuracy, sensitivity, and specificity as well as multiple other metrics on both the test set and the external test set.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>During the follow-up of 5 years, 2610 (41.6%) participants and 760 (35.2%) participants progressed from prediabetes to diabetes, with mean annual progression rates of 8.34% and 7.04% in the primary cohort and the external cohort, respectively. Using 14 features selected using the recursive feature elimination-logistic algorithm, the CatBoost model achieved optimal performance in the test set and the external test set with an area under the receiver operating characteristic curve of 0.819 and 0.807, respectively. It also showed the best discrimination performance on the accuracy, negative predictive value (NPV), and F1-scores as well as the calibration performances in both the test set and the external test set. Then the Shapley Additive Explanations (SHAP) analysis highlighted the top 6 predictors (FBG, HDL, ALT/AST, BMI, age, and MONO), enabling targeted modification of these risk factors to reduce diabetes incidence.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>We developed a 5-year risk prediction model of progression from prediabetes to diabetes for the Chinese population, with the CatBoost model showing the best predictive performance, which could effectively identify individuals at high risk of diabetes.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>Chinese population</kwd>
        <kwd>CatBoost</kwd>
        <kwd>SHAP</kwd>
        <kwd>risk factors</kwd>
        <kwd>clinical decision support</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Diabetes has become a severe global public health concern, affecting 537 million adults aged 20-79 years worldwide and threatening 860 million adults worldwide due to impaired glucose tolerance and impaired fasting glucose, which are commonly known as prediabetes [<xref ref-type="bibr" rid="ref1">1</xref>]. The burden of diabetes now surpasses the combined global impact of tuberculosis, AIDS, and malaria [<xref ref-type="bibr" rid="ref2">2</xref>]. In 2021, China had approximately 141 million adults with diabetes and 197 million adults with prediabetes, ranking first globally for both conditions [<xref ref-type="bibr" rid="ref1">1</xref>]. Prediabetes is typically viewed as a transitional stage of diabetes, which can return to normal or progress to diabetes [<xref ref-type="bibr" rid="ref3">3</xref>]. Around 5%-10% of patients with prediabetes progress to diabetes every year, and up to 70% could develop diabetes eventually [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. However, with lifestyle intervention and medications, the risk of diabetes in patients with prediabetes can be greatly decreased [<xref ref-type="bibr" rid="ref6">6</xref>]. Therefore, identifying high-risk individuals among patients with prediabetes and intervening in advance could greatly reduce the incidence and health care burden of diabetes.</p>
      <p>Machine learning has been widely used in the field of diabetes and prediabetes, including early diagnosis and risk prediction. Xue et al [<xref ref-type="bibr" rid="ref7">7</xref>] built four machine learning models to diagnose type 2 diabetes using physical measurements and questionnaire information. Abnoosian et al [<xref ref-type="bibr" rid="ref8">8</xref>] developed an integrated multiclassifier machine learning model using various data preprocessing techniques and machine learning algorithms to identify patients with 3 conditions: diabetic, prediabetic, and nondiabetic. Hu et al [<xref ref-type="bibr" rid="ref9">9</xref>] constructed a model to predict the 5-year risk of developing prediabetes in the Chinese population. Schallmoser et al [<xref ref-type="bibr" rid="ref10">10</xref>] created 2 machine learning models for predicting the risk of microvascular or macrovascular complications within 5 years in patients with prediabetes or diabetes. In terms of the progression from prediabetes to diabetes, Cahn et al [<xref ref-type="bibr" rid="ref11">11</xref>] constructed a 1-year risk prediction model using 3 datasets, demonstrating superior accuracy (area under the receiver operating characteristic curve [AUC] 0.865-0.925) over logistic regression. Liu et al [<xref ref-type="bibr" rid="ref12">12</xref>] developed a 1- or 2-year risk prediction model for the Chinese older adults based on extreme gradient boosting machine (XGBoost), demonstrating modest predictive performance (AUC 0.67). Chen et al [<xref ref-type="bibr" rid="ref13">13</xref>] built a 3-year risk prediction model for the Chinese based on logistic regression using 9 indicators and achieved optimal performance (AUC 0.78). Aoki et al [<xref ref-type="bibr" rid="ref14">14</xref>] created a 5-year risk prediction model (AUC 0.87) for Americans based on the random forest using 8 laboratory indicators. Although these predictive models for the progression of prediabetes have been developed, Chinese-focused models are limited to short observation periods (≤3 years), and there is currently a lack of a 5-year prediction model specifically tailored to the Chinese population. Prediabetes often undergoes a gradual progression that can last for over 10 years; hence, a long-term risk prediction model would be more meaningful than a short-term prediction model. Therefore, to address this clinical and geographical gap, we aimed to develop and validate a 5-year risk prediction model for the progression from prediabetes to diabetes within the Chinese population, and to establish an interactive web-based platform for easy clinical practice.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Participants</title>
        <p>This research was a retrospective cohort study that used health checkup data from 2 independent medical centers, namely the First Affiliated Hospital of Shandong First Medical University (the primary cohort) and Binzhou Medical University Hospital (the external cohort). Participants were tracked from 2019 to 2024 over a consecutive 5-year period, with annual assessments conducted at a fixed time each year to evaluate diabetes progression based on the American Diabetes Association (ADA) diagnostic criterion of a hemoglobin A<sub>1c</sub> (HbA<sub>1c</sub>) level of ≥6.5% [<xref ref-type="bibr" rid="ref15">15</xref>]. Inclusion criteria required participants to have a confirmed diagnosis of prediabetes (HbA<sub>1c</sub> level of 5.7%-6.4%) at the 2019 baseline examination. Exclusion criteria ‌included pre-existing diabetes (HbA<sub>1c</sub> level of ≥6.5% or use of glucose-lowering therapy), history of gestational diabetes, use of medications known to affect glucose metabolism, any previous diagnosis of malignancy, and absence of a second physical examination after the year of 2019. After finalizing study cohort and variable selection, data cleaning was performed by removing participants with any missing values. This complete-case analysis approach is methodologically sound when the proportion of missing data is minimal, as it ensures data integrity while maintaining sufficient statistical power. The study design is illustrated in <xref rid="figure1" ref-type="fig">Figure 1</xref>.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flowchart of this study. RFE: recursive feature elimination.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e73190_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Data Collection</title>
        <p>We collected 42 variables in total from the database based on literature review, clinical expertise, and data availability, including demographics, physical measures, and hematologic biomarkers. These variables are gender, age, height, weight, BMI, systolic blood pressure, diastolic blood pressure, white blood cell, neutrophil count, lymphocyte count, monocyte count (MONO), hemoglobin, red blood cell (RBC), platelet count, alanine aminotransferase (ALT), aspartate aminotransferase (AST), ALT to AST ratio (ALT/AST), gamma-glutamyl transferase, alkaline phosphatase, total bilirubin, direct bilirubin, indirect bilirubin, total protein, albumin, globulin, albumin to globulin ratio (albumin/globulin), triglycerides, total cholesterol (TC), high-density lipoprotein cholesterol (HDL), low-density lipoprotein cholesterol (LDL), HDL to TC ratio (HDL/TC), blood urea nitrogen (BUN), creatinine, uric acid, estimated glomerular filtration rate, BUN to creatinine ratio (BUN/creatinine), fasting blood glucose (FBG), hematocrit, mean corpuscular hemoglobin, triglyceride-glucose, monocyte to high-density lipoprotein cholesterol ratio, and neutrophil to high-density lipoprotein cholesterol ratio.</p>
        <p>Physical and laboratory examinations are carried out by trained medical staff in accordance with uniform standards. Height and weight measurements require participants to remove heavy clothing and take off shoes. The fully automatic electronic sphygmomanometer was used to measure the participants’ blood pressure in the right upper arm after sitting still and resting for 10 min. The measurement of blood pressure was made twice, each time with an interval of 1-2 minutes, and the average of the 2 readings was taken and recorded. Blood samples were collected from the antecubital vein after an 8- to 10-hour fast and were promptly sent to the clinical laboratory for processing. BMI was calculated as weight (kg) divided by the square of height (m²), and triglyceride-glucose was calculated as Ln (fasting triglycerides [mg/dL] × fasting glucose [mg/dL]/2).</p>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <p>Baseline characteristics were analyzed using R version 4.3.1 (R Foundation for Statistical Computing). Quantitative data were analyzed using Student <italic>t</italic> test or nonparametric Wilcoxon signed-rank test, while qualitative data were analyzed using chi-square test or Fisher exact test. Statistical significance thresholds were set at <italic>P</italic>&#60;.05 for all comparative analyses.</p>
        <p>Model training and validation were conducted using the scikit-learn package (version 1.4.0) in Python (version 3.11.5). Initially, the primary cohort was randomly divided into a training set (comprising 70% of the participants) and a test set (comprising the remaining 30%) [<xref ref-type="bibr" rid="ref16">16</xref>]. To ensure better model performance and reduce redundant features, recursive feature elimination (RFE) was used on the training set for feature selection with the logistic regression model as the base model [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. Subsequently, 7 machine learning algorithms were selected, namely logistic regression, random forest, support vector machine, multilayer perceptron, XGBoost, light gradient boosting machine, and categorical boosting machine (CatBoost) to construct the prediction models. These models were trained and optimized on the training set, with the optimal parameters determined using grid search and 5-fold cross-validation. The next step involved validating the models’ discrimination and calibration ability using the test set of the primary cohort and the external cohort. The discrimination ability of different models was compared using AUC and the area under the precision-recall (PR) curve, along with accuracy, sensitivity, specificity, positive predictive value, NPV, and <italic>F</italic><sub>1</sub>-score. The DeLong test was used for comparing AUC differences between models‌. The calibration ability of different models was compared using the calibration curves to assess the consistency between predicted and observed values. The Shapley Additive Explanations (SHAP) method was used to analyze variable importance for the best-performing machine learning model. Finally, decision curve analysis was used to evaluate the clinical application values of each machine learning model, and an interactive web page for easy clinical use was developed using the Python Gradio framework.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study followed the principles of the Declaration of Helsinki and was approved by the Ethics Committee of the First Affiliated Hospital of Shandong First Medical University (2024S657), and the informed consent was waived off by the review boards due to the retrospective nature of this research. All the images and tables presented in the manuscript and supplementary materials were anonymized in accordance with ethical standards, ensuring no personally identifiable information could be discerned.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Baseline Characteristics</title>
        <p>This study enrolled 6270 eligible participants in the primary cohort and 2157 in the external cohort. Over a 5-year period, 2610 participants (41.6%) in the primary cohort and 760 (35.2%) in the external cohort progressed from prediabetes to diabetes, with mean annual progression rates of 8.33% and 7.04%. The characteristics of the primary and external cohorts are shown in Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Over the 5-year follow-up period, 510 participants were lost to follow-up in the primary cohort. A comparative analysis of baseline characteristics between the lost to follow-up group (n=510) and the completed follow-up group (n=6270) revealed no statistically significant differences in any observed variables (<italic>P</italic>&#62;.05) as shown in Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Given the lost-to-follow-up–rate of 7.5% (510/6780) and 5.2% (127/2430) in the primary and the external cohort respectively, the demonstrated baseline equivalence between groups, we conclude that the cases lost to follow-up are unlikely to compromise the validity of the analytical outcomes.</p>
      </sec>
      <sec>
        <title>Model Construction and Validation</title>
        <p>The RFE-logistic feature selection algorithm finally screened 14 out of 42 health checkup variables using the training set of the primary cohort, which were hematocrit, hemoglobin, RBC, MONO, FBG, HDL/TC, LDL, HDL, creatinine, ALT/AST, age, height, weight, and BMI. As illustrated in Figure S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, the RFE-logistic cross-validation analysis demonstrated a plateau in AUC ‌when reaching‌ 14 features, ‌with no significant improvement observed‌ when incorporating more features. As shown in Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, the RFE ranking system eliminated lower-priority variables through iterative cross-validation (where rank=1 denotes retained features, and higher ranks reflect earlier elimination during the feature selection process‌). The discrimination performances of the 7 machine learning models on the test set and the external test set were shown in <xref rid="figure2" ref-type="fig">Figure 2</xref> and <xref ref-type="table" rid="table1">Table 1</xref>, in which the ROC curves indicated that the CatBoost model had the best performance on both of the test sets (AUC 0.819) and the external test set (AUC 0.807), and the DeLong test revealed that the differences in AUC values for the models on 2 cohorts were statistically significant (<italic>P</italic>&#60;.05). The PR curve analysis further confirmed the superior discriminative performance of the CatBoost model, demonstrating significant advantages on both sets. In addition, the CatBoost model showed the best accuracy (74.6%), sensitivity (0.648), NPV (0.765), <italic>F</italic><sub>1</sub>-score (0.68) on the test set, and the best accuracy (75.9%), NPV (0.787), and <italic>F</italic><sub>1</sub>-score (0.626) on the external test set. The confusion matrix for the 7 machine learning models on both sets is shown in Figure S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        <p>Meanwhile, the calibration performances of the 7 models on the test set and the external test set were evaluated using calibration curves as shown in plots A and C in <xref rid="figure3" ref-type="fig">Figure 3</xref>, in which the black curve corresponding to the CatBoost model had been distributed closest to the dashed line in the middle, indicating the best calibration ability in both sets. The clinical application value of the 7 models on the test set and the external test set were evaluated using decision curves as shown in plot B and D in <xref rid="figure3" ref-type="fig">Figure 3</xref>, in which the area under the curve of the CatBoost model reached the maximum, and when the threshold probability was less than around 0.80, all the clinical decisions made would be beneficial to the patients.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Receiver operating characteristic curve and precision-recall curve curves of the 7 models on the test set and the external test set. Plots A and B depict the model performances on the test set, and plots C and D present the model performances on the external test set. CatBoost: categorical boosting; LightGBM: light gradient boosting machine; MLP: multiplayer perceptron; ROC: receiver operating characteristic; SVM: support vector machine; XGBoost: extreme gradient boosting machine.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e73190_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>The metrics of model performance on the test set and the external test set.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="270"/>
            <col width="0"/>
            <col width="160"/>
            <col width="0"/>
            <col width="110"/>
            <col width="0"/>
            <col width="130"/>
            <col width="0"/>
            <col width="100"/>
            <col width="0"/>
            <col width="100"/>
            <col width="0"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Models</td>
                <td colspan="2">Accuracy</td>
                <td colspan="2">Sensitivity</td>
                <td colspan="2">Specificity</td>
                <td colspan="2">PPV<sup>a</sup></td>
                <td colspan="2">NPV<sup>b</sup></td>
                <td><italic>F</italic><sub>1</sub>-score</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="14">
                  <bold>The test set in the primary cohort</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Logistic regression</td>
                <td colspan="2">0.739</td>
                <td colspan="2">0.577</td>
                <td colspan="2">0.854</td>
                <td colspan="2">0.738</td>
                <td colspan="2">0.739</td>
                <td colspan="2">0.648</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Random forest</td>
                <td colspan="2">0.741</td>
                <td colspan="2">0.592</td>
                <td colspan="2">0.846</td>
                <td colspan="2">0.732</td>
                <td colspan="2">0.745</td>
                <td colspan="2">0.655</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>SVM<sup>c</sup></td>
                <td colspan="2">0.677</td>
                <td colspan="2">0.277</td>
                <td colspan="2">0.961</td>
                <td colspan="2">0.834</td>
                <td colspan="2">0.651</td>
                <td colspan="2">0.417</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>XGBoost<sup>d</sup></td>
                <td colspan="2">0.74</td>
                <td colspan="2">0.647</td>
                <td colspan="2">0.806</td>
                <td colspan="2">0.704</td>
                <td colspan="2">0.762</td>
                <td colspan="2">0.674</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>MLP<sup>e</sup></td>
                <td colspan="2">0.665</td>
                <td colspan="2">0.367</td>
                <td colspan="2">0.877</td>
                <td colspan="2">0.68</td>
                <td colspan="2">0.66</td>
                <td colspan="2">0.477</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LightGBM<sup>f</sup></td>
                <td colspan="2">0.744</td>
                <td colspan="2">0.61</td>
                <td colspan="2">0.838</td>
                <td colspan="2">0.729</td>
                <td colspan="2">0.751</td>
                <td colspan="2">0.664</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>CatBoost<sup>g</sup></td>
                <td colspan="2">0.746</td>
                <td colspan="2">0.648</td>
                <td colspan="2">0.816</td>
                <td colspan="2">0.715</td>
                <td colspan="2">0.765</td>
                <td colspan="2">0.68</td>
              </tr>
              <tr valign="top">
                <td colspan="14">
                  <bold>The external test set</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Logistic regression</td>
                <td colspan="2">0.749</td>
                <td colspan="2">0.45</td>
                <td colspan="2">0.913</td>
                <td colspan="2">0.737</td>
                <td colspan="2">0.753</td>
                <td colspan="2">0.559</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Random forest</td>
                <td colspan="2">0.755</td>
                <td colspan="2">0.578</td>
                <td colspan="2">0.852</td>
                <td colspan="2">0.68</td>
                <td colspan="2">0.786</td>
                <td colspan="2">0.624</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>SVM</td>
                <td colspan="2">0.75</td>
                <td colspan="2">0.468</td>
                <td colspan="2">0.904</td>
                <td colspan="2">0.727</td>
                <td colspan="2">0.758</td>
                <td colspan="2">0.57</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>XGBoost</td>
                <td colspan="2">0.74</td>
                <td colspan="2">0.554</td>
                <td colspan="2">0.842</td>
                <td colspan="2">0.656</td>
                <td colspan="2">0.776</td>
                <td colspan="2">0.601</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>MLP</td>
                <td colspan="2">0.717</td>
                <td colspan="2">0.499</td>
                <td colspan="2">0.836</td>
                <td colspan="2">0.623</td>
                <td colspan="2">0.754</td>
                <td colspan="2">0.554</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LightGBM</td>
                <td colspan="2">0.747</td>
                <td colspan="2">0.424</td>
                <td colspan="2">0.923</td>
                <td colspan="2">0.75</td>
                <td colspan="2">0.747</td>
                <td colspan="2">0.542</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>CatBoost</td>
                <td colspan="2">0.759</td>
                <td colspan="2">0.572</td>
                <td colspan="2">0.86</td>
                <td colspan="2">0.69</td>
                <td colspan="2">0.787</td>
                <td colspan="2">0.626</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>PPV: positive predictive value.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>NPV: negative predictive value.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>SVM: support vector machine.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>XGBoost: extreme gradient boosting.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>MLP: multiplayer perceptron.</p>
            </fn>
            <fn id="table1fn6">
              <p><sup>f</sup>LightGBM: light gradient boosting machine.</p>
            </fn>
            <fn id="table1fn7">
              <p><sup>g</sup>CatBoost: categorical boosting.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>The calibration curves and clinical decision curves of the 7 models on the test set and the external test set. Plots A and B depict the model performances on the test set, and plots C and D present the model performances on the external test set. CatBoost: categorical boosting; LightGBM: light gradient boosting machine; MLP: multiplayer perceptron; SVM: support vector machine; XGBoost: extreme gradient boosting machine.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e73190_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Feature Importance</title>
        <p>The SHAP analysis of the best-performing CatBoost model is shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>. The top 6 variables contributing most to the model were FBG, HDL, ALT/AST, BMI, age, and MONO, where HDL and ALT/AST were negatively correlated with the outcome, that is, protective against progression to diabetes, and the rest were positively correlated and risky for progression to diabetes. Baseline FBG was the most important factor affecting the CatBoost model. In addition, the SHAP dependency plots for the 6 features were shown in <xref rid="figure5" ref-type="fig">Figure 5</xref>, which showed the correspondence between the change in the value of variables and the change of importance to the CatBoost model indicated by SHAP values. Finally, we constructed the user-friendly interactive web interface of the prediction model for progression from prediabetes to diabetes as shown in Figure S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>SHapley Additive exPlanations feature importance and summary plot of the CatBoost model. ALT: alanine aminotransferase; AST: aspartate aminotransferase; FBG: fasting blood glucose; HDL: high-density lipoprotein cholesterol; LDL: low-density lipoprotein cholesterol; MONO: monocyte count; RBC: red blood cell.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e73190_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>The Shapley Additive Explanations dependency plots for the top 6 features. ALT: alanine aminotransferase; AST: aspartate aminotransferase; FBG: fasting blood glucose; HDL: high-density lipoprotein cholesterol; MONO: monocyte count.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e73190_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec>
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In this retrospective cohort study, we used 7 machine learning algorithms to build and evaluate 5-year risk prediction models for the progression from prediabetes to diabetes in 2 different cohorts. Among them, the CatBoost model showed the best performance in terms of discrimination and calibration. The CatBoost model achieved the highest AUC values in both the test set (‌0.819‌) and external validation set (‌0.807‌), outperforming all other models. This indicates its exceptional ability to distinguish individuals who will progress to diabetes from those who will not. The model’s AUC values reflect good discrimination for clinical use (AUC ≥0.8 is often considered strong in risk prediction), placing it in the mid-to-high range of published studies (AUC 0.67-0.87) and approaching top-tier models [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]. The stability of AUC across internal and external test sets (‌&#60;2% difference‌) suggests that the 14 features selected by RFE-logistic capture biologically and clinically generalizable signals, rather than overfitting to cohort-specific noise. Compared with the traditional logistic regression model, the CatBoost model’s improvement‌ in AUC highlights the value of ensemble algorithms in modeling complex interactions between metabolic, hematological, and anthropometric variables.</p>
        <p>Among the 7 evaluated models, the CatBoost algorithm also demonstrated superior performance in sensitivity, NPV, and <italic>F</italic><sub>1</sub>-score‌. In disease screening and risk assessment contexts, high sensitivity holds particular clinical significance as missed diagnoses of high-risk patients may lead to severe health consequences. Our study also took into consideration the cost-benefit analysis of false-positive cases, systematically balancing the economic and psychological burdens against diagnostic sensitivity through optimized thresholds. The CatBoost model exhibited exceptional capability in low-risk population exclusion, achieving NPV of 76.5% and 78.7% in 2 cohorts. This performance positions it as an ideal solution for resource-constrained health care settings, enabling efficient allocation of medical resources to medium- and high-risk subgroups.</p>
        <p>The CatBoost model dominated the space of the precision-recall curve, achieving the highest precision at different recall levels. For example, at a recall of 0.648 in the test set, the model maintained a highest precision of ‌0.715‌. This superiority implies that CatBoost reduces ‌unnecessary interventions‌; for every 100 patients flagged as “high-risk” by CatBoost, 71.5% would truly progress to diabetes. In resource-constrained settings, this precision directly translates to cost savings and reduced patient anxiety. The decision curves further validated the clinical value of the CatBoost model. When the threshold probability for intervention was below 80%, the model provided a net benefit over “treat all” or “treat none” strategies, which means the model remains clinically beneficial across a wide range of risk thresholds, accommodating varying risk tolerance among patients and health care systems.</p>
        <p>SHAP analysis of the feature importance identified FBG, HDL, ALT/AST, BMI, age, and MONO as the top 6 variables contributing the most to the CatBoost model, and an interactive web interface for this model was constructed. This interface provided caregivers with an easy tool to assess the 5-year risk of progression to diabetes in patients with prediabetes. It can be integrated into the health information system in China, which could streamline risk assessment, allowing automated alerts for high-risk prediabetic patients during routine health check-ups. By stratifying patients into risk categories, clinicians can prioritize high-risk individuals for intensive monitoring or early lifestyle intervention, such as dietary changes, physical activity plans, or pharmacological approaches in alignment with current clinical guidelines. The web interface bridges the gap between predictive analytics and clinical decision-making, advocating for a paradigm shift toward data-driven, individualized prevention strategies, emphasizing early intervention in high-risk groups to curb diabetes progression.</p>
      </sec>
      <sec>
        <title>Comparisons With Previous Work</title>
        <p>The application of machine learning techniques has made significant progress in the field of diabetes, opening up new possibilities for early diagnosis and prevention. CatBoost is an advanced machine learning algorithm designed for gradient boosting with decision trees, applicable to a variety of tasks including classification, regression, and ranking. It leverages techniques such as ordered boosting, stochastic permutations, and gradient-driven optimization to deliver superior results [<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref20">20</xref>]. Shojaee et al [<xref ref-type="bibr" rid="ref18">18</xref>] developed a fasting blood glucose status prediction model using the CatBoost algorithm based on 3376 adults older than 30 years at 16 comprehensive health service centers in Tehran, Iran, which demonstrated good performance with 0.737 AUC. Shiren et al [<xref ref-type="bibr" rid="ref19">19</xref>] developed a cutting-edge, interpretable risk assessment model for patients with diabetes. The CatBoost algorithm significantly outperformed the other methods in terms of AUC, delivering an impressive average AUC of 90.47% across 4 diabetes-related complications, namely coronary heart disease, diabetic nephropathy, diabetic retinopathy, and nonalcoholic fatty liver disease. Qiu et al [<xref ref-type="bibr" rid="ref20">20</xref>] constructed a model capable of forecasting the likelihood of cancer in individuals with type 2 diabetes by using tumor biomarkers from a dataset of 5198 patients. The CatBoost model yielded a favorable AUC of 0.852, which might be helpful for early cancer detection and prevention. While CatBoost offers notable advantages, it also has drawbacks. It exhibits higher computational demands compared with lightweight frameworks like light gradient boosting machine (LightGBM), particularly with large datasets. ‌Its performance is sensitive to hyperparameter tuning, demanding significant computational resources and time.‌ In addition, the model’s complexity makes interpretation challenging without external tools like SHAP for transparency.</p>
        <p>The variables selected from RFE-logistic algorithm have been proven to be relevant to diabetes in different ways. Changes in hematocrit can alter red blood cell ratios, affecting HbA<sub>1c</sub> test results and causing overestimation or underestimation of true blood glucose levels in type 2 diabetes [<xref ref-type="bibr" rid="ref21">21</xref>]. HbA<sub>1c</sub> had significant correlations with RBC and hemoglobin because chronic hyperglycemia can exacerbate inflammation and alter hematological parameters in diabetic patients [<xref ref-type="bibr" rid="ref22">22</xref>]. HDL is a protective factor against diabetes, while lower levels of HDL are associated with increased insulin resistance and elevated cardiovascular risk ‌[<xref ref-type="bibr" rid="ref23">23</xref>]. ALT, TC, triglycerides, HDL, and LDL are clinically significant biomarkers associated with diabetes, which serve as sensitive indicators of insulin resistance and metabolic syndrome [<xref ref-type="bibr" rid="ref24">24</xref>]. ‌Studies also demonstrate BMI is a modifiable risk factor for diabetes and its macrovascular and microvascular complications. There are positive correlations between BMI and key glycemic control parameters, FBG and HbA<sub>1c</sub>, highlighting its role in β-cell dysfunction and systemic insulin resistance ‌[<xref ref-type="bibr" rid="ref25">25</xref>]. The results of the feature importance analysis are consistent with the other diabetes studies, where FPG was the most important factor contributing to diabetes risk. As the core diagnostic criterion for diabetes, FBG directly reflects the pathological mechanisms of insulin resistance and β-cell dysfunction‌. Even when FBG levels remain below the diagnostic threshold for diabetes, persistent elevation can accelerate β-cell functional failure through glucotoxic effects‌. In addition, age, BMI, HDL as well as ALT/AST played significant roles in influencing the risk of diabetes [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref28">28</xref>]. Aging directly contributes to the decline of pancreatic β-cell function and reduced insulin sensitivity‌. With aging, diminished hepatic gluconeogenesis regulation and impaired glucose uptake efficiency in muscle tissues progressively destabilize fasting glucose homeostasis‌, which might underlie the critical transition from prediabetes to diabetes‌. We also found that MONO was an important factor contributing to diabetes risk. Monocytes release a variety of inflammatory mediators and participate in the inflammatory and injury processes in our body, and may prompt the progression from prediabetes to diabetes [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>].</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>To the best of our knowledge, this study is the first to develop a 5-year risk prediction model for the progression from prediabetes to diabetes based on the Chinese population. China faces a heavy disease and economic burden due to diabetes and its complications, and identifying high-risk populations among patients with prediabetes could reduce the health care burden of diabetes by implementing lifestyle and pharmacological interventions [<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref33">33</xref>]. There are some limitations of our study. First, due to the retrospective nature of this study, the absence of some risk factors, such as smoking, drinking, and the family history of diabetes may introduce residual confounding, while the lack of longitudinal tracking of some variables during follow-up‌ could affect the predictive validity. Second, out of operational practicality, we take HbA<sub>1c</sub> as the sole diagnostic criterion for diabetes in this study. While HbA<sub>1c</sub> demonstrates superior accuracy in reflecting long-term glycemic levels [<xref ref-type="bibr" rid="ref34">34</xref>-<xref ref-type="bibr" rid="ref36">36</xref>], the exclusion of complementary assessments, such as FBG, oral glucose tolerance test, and clinical symptom evaluation, may introduce diagnostic bias, which might reduce the generalizability of our prediction model. Third, the absence of external validation in populations with distinct genetic backgrounds may limit extrapolation to other ethnic groups. In the future, we will establish prospective cohorts to include more risk factors, diagnostic variables, and implement longitudinal monitoring‌. In addition, we will validate our model across diverse ethnic and geographic populations through multi-center collaborations to enhance the generalizability.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In conclusion, we constructed and evaluated seven 5-year risk prediction models for the progression from prediabetes to diabetes using machine learning algorithms based on the Chinese health checkup cohorts. The CatBoost model demonstrated the best performance, suggesting its potential as an effective tool in the field of diabetes prevention and management. We can embed the model in electronic health records to flag high-risk individuals during annual checkups, enable targeted allocation of glucose monitoring resources, and facilitate early lifestyle modification to these predicted high-risk patients to reduce diabetes incidence and health care burdens.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Additional material.</p>
        <media xlink:href="jmir_v27i1e73190_app1.docx" xlink:title="DOCX File , 566 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ADA</term>
          <def>
            <p>American Diabetes Association</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ALT</term>
          <def>
            <p>alanine aminotransferase</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">AST</term>
          <def>
            <p>aspartate aminotransferase</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">AUC</term>
          <def>
            <p>the area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">BUN</term>
          <def>
            <p>blood urea nitrogen</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">CatBoost</term>
          <def>
            <p>categorical boosting machine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">FBG</term>
          <def>
            <p>fasting blood glucose</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">HbA1c</term>
          <def>
            <p>hemoglobin A1c</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">HDL</term>
          <def>
            <p>high-density lipoprotein cholesterol</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">LDL</term>
          <def>
            <p>low-density lipoprotein cholesterol</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">LightGBM</term>
          <def>
            <p>light gradient boosting machine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">MONO</term>
          <def>
            <p>monocyte count</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">NPV</term>
          <def>
            <p>negative predictive value</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">PR</term>
          <def>
            <p>precision-recall</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">RBC</term>
          <def>
            <p>red blood cell</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">RFE</term>
          <def>
            <p>recursive feature elimination</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">ROC</term>
          <def>
            <p>receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb18">SHAP</term>
          <def>
            <p>Shapley Additive Explanations</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb19">TC</term>
          <def>
            <p>total cholesterol</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb20">XGBoost</term>
          <def>
            <p>extreme gradient boosting</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by grants from the Shandong-Chongqing Science and Technology Cooperation Project (2024LYXZ021), the Shandong Provincial Medical Association Research Project (YXH2024YS050), and the Natural Science Foundation of Shandong Province (ZR2023QG014).</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The datasets generated or analyzed during this study are available from the corresponding author on reasonable request.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>YZ contributed to conceptualization, formal analysis, methodology, and writing—original draft. HZ contributed to investigation and data curation. DW contributed to supervision, writing—review and editing. NL and HL contributed to investigation. GZ contributed to funding acquisition, project administration, writing—review and editing.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Magliano</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Boyko</surname>
              <given-names>EJ</given-names>
            </name>
          </person-group>
          <article-title>IDF Diabetes Atlas 10th edition scientific committee</article-title>
          <source>IDF Diabetes Atlas</source>
          <year>2021</year>
          <publisher-loc>Brussels</publisher-loc>
          <publisher-name>International Diabetes Federation</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="book">
          <source>State of inequality: HIV, tuberculosis and malaria</source>
          <year>2021</year>
          <publisher-loc>Geneva</publisher-loc>
          <publisher-name>WHO</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Echouffo-Tcheugui</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Perreault</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dagogo-Jack</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Diagnosis and management of prediabetes: a review</article-title>
          <source>JAMA</source>
          <year>2023</year>
          <month>04</month>
          <day>11</day>
          <volume>329</volume>
          <issue>14</issue>
          <fpage>1206</fpage>
          <lpage>1216</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2023.4063</pub-id>
          <pub-id pub-id-type="medline">37039787</pub-id>
          <pub-id pub-id-type="pii">2803510</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Marseglia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fratiglioni</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Welmer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Natural history of prediabetes in older adults from a population-based longitudinal study</article-title>
          <source>J Intern Med</source>
          <year>2019</year>
          <month>09</month>
          <volume>286</volume>
          <issue>3</issue>
          <fpage>326</fpage>
          <lpage>340</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31165572"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/joim.12920</pub-id>
          <pub-id pub-id-type="medline">31165572</pub-id>
          <pub-id pub-id-type="pmcid">PMC6851857</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chua</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>From pre-diabetes to diabetes: diagnosis, treatments and translational research</article-title>
          <source>Medicina (Kaunas)</source>
          <year>2019</year>
          <month>08</month>
          <day>29</day>
          <volume>55</volume>
          <issue>9</issue>
          <fpage>546</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=medicina55090546"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/medicina55090546</pub-id>
          <pub-id pub-id-type="medline">31470636</pub-id>
          <pub-id pub-id-type="pii">medicina55090546</pub-id>
          <pub-id pub-id-type="pmcid">PMC6780236</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chai</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gong</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shao</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Effectiveness of different intervention modes in lifestyle intervention for the prevention of type 2 diabetes and the reversion to normoglycemia in adults with prediabetes: systematic review and meta-analysis of randomized controlled trials</article-title>
          <source>J Med Internet Res</source>
          <year>2025</year>
          <month>01</month>
          <day>29</day>
          <volume>27</volume>
          <fpage>e63975</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2025//e63975/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/63975</pub-id>
          <pub-id pub-id-type="medline">39879607</pub-id>
          <pub-id pub-id-type="pii">v27i1e63975</pub-id>
          <pub-id pub-id-type="pmcid">PMC11822313</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xue</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Identification of potential type II diabetes in a large-scale chinese population using a systematic machine learning framework</article-title>
          <source>J Diabetes Res</source>
          <year>2020</year>
          <volume>2020</volume>
          <fpage>6873891</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1155/2020/6873891"/>
          </comment>
          <pub-id pub-id-type="doi">10.1155/2020/6873891</pub-id>
          <pub-id pub-id-type="medline">33029536</pub-id>
          <pub-id pub-id-type="pmcid">PMC7532405</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abnoosian</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Farnoosh</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Behzadi</surname>
              <given-names>MH</given-names>
            </name>
          </person-group>
          <article-title>Prediction of diabetes disease using an ensemble of machine learning multi-classifier models</article-title>
          <source>BMC Bioinformatics</source>
          <year>2023</year>
          <month>09</month>
          <day>12</day>
          <volume>24</volume>
          <issue>1</issue>
          <fpage>337</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/s12859-023-05465-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12859-023-05465-z</pub-id>
          <pub-id pub-id-type="medline">37697283</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12859-023-05465-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC10496262</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ni</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>A nomogram model for predicting 5-year risk of prediabetes in Chinese adults</article-title>
          <source>Sci Rep</source>
          <year>2023</year>
          <month>12</month>
          <day>18</day>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>22523</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-023-50122-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-023-50122-3</pub-id>
          <pub-id pub-id-type="medline">38110661</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-023-50122-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC10728122</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schallmoser</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zueger</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kraus</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Saar-Tsechansky</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stettler</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Feuerriegel</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for predicting micro- and macrovascular complications in individuals with prediabetes or diabetes: retrospective cohort study</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>02</month>
          <day>27</day>
          <volume>25</volume>
          <fpage>e42181</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://boris.unibe.ch/id/eprint/179310"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/42181</pub-id>
          <pub-id pub-id-type="medline">36848190</pub-id>
          <pub-id pub-id-type="pii">v25i1e42181</pub-id>
          <pub-id pub-id-type="pmcid">PMC10012007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cahn</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shoshan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sagiv</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yesharim</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Goshen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shalev</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Raz</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Prediction of progression from pre-diabetes to diabetes: Development and validation of a machine learning model</article-title>
          <source>Diabetes Metab Res Rev</source>
          <year>2020</year>
          <month>02</month>
          <volume>36</volume>
          <issue>2</issue>
          <fpage>e3252</fpage>
          <pub-id pub-id-type="doi">10.1002/dmrr.3252</pub-id>
          <pub-id pub-id-type="medline">31943669</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Predicting the 2-year risk of progression from prediabetes to diabetes using machine learning among Chinese elderly adults</article-title>
          <source>J Pers Med</source>
          <year>2022</year>
          <month>06</month>
          <day>27</day>
          <volume>12</volume>
          <issue>7</issue>
          <fpage>1055</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=jpm12071055"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/jpm12071055</pub-id>
          <pub-id pub-id-type="medline">35887552</pub-id>
          <pub-id pub-id-type="pii">jpm12071055</pub-id>
          <pub-id pub-id-type="pmcid">PMC9324396</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Risk prediction of diabetes progression using big data mining with multifarious physical examination indicators</article-title>
          <source>Diabetes Metab Syndr Obes</source>
          <year>2024</year>
          <volume>17</volume>
          <fpage>1249</fpage>
          <lpage>1265</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.tandfonline.com/doi/abs/10.2147/DMSO.S449955?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.2147/DMSO.S449955</pub-id>
          <pub-id pub-id-type="medline">38496004</pub-id>
          <pub-id pub-id-type="pii">449955</pub-id>
          <pub-id pub-id-type="pmcid">PMC10942017</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aoki</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Khalid</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Kaya</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Nagymanyoki</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Hussong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Salama</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Progression from prediabetes to diabetes in a diverse U.S. population: a machine learning model</article-title>
          <source>Diabetes Technol Ther</source>
          <year>2024</year>
          <volume>26</volume>
          <issue>10</issue>
          <fpage>748</fpage>
          <lpage>753</lpage>
          <pub-id pub-id-type="doi">10.1089/dia.2024.0052</pub-id>
          <pub-id pub-id-type="medline">38621172</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Feature selection with kernelized multi-class support vector machine</article-title>
          <source>Pattern Recognit</source>
          <year>2021</year>
          <volume>117</volume>
          <fpage>107988</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.patcog.2021.107988"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.patcog.2021.107988</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for prediction and risk stratification of lupus nephritis renal flare</article-title>
          <source>Am J Nephrol</source>
          <year>2021</year>
          <volume>52</volume>
          <issue>2</issue>
          <fpage>152</fpage>
          <lpage>160</lpage>
          <pub-id pub-id-type="doi">10.1159/000513566</pub-id>
          <pub-id pub-id-type="medline">33744876</pub-id>
          <pub-id pub-id-type="pii">000513566</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>A novel MissForest-based missing values imputation approach with recursive feature elimination in medical applications</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2024</year>
          <volume>24</volume>
          <issue>1</issue>
          <fpage>269</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/s12874-024-02392-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12874-024-02392-2</pub-id>
          <pub-id pub-id-type="medline">39516783</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12874-024-02392-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC11546113</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shojaee-Mend</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Velayati</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Tayefi</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Babaee</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Prediction of diabetes using data mining and machine learning algorithms: a cross-sectional study</article-title>
          <source>Healthc Inform Res</source>
          <year>2024</year>
          <volume>30</volume>
          <issue>1</issue>
          <fpage>73</fpage>
          <lpage>82</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38359851"/>
          </comment>
          <pub-id pub-id-type="doi">10.4258/hir.2024.30.1.73</pub-id>
          <pub-id pub-id-type="medline">38359851</pub-id>
          <pub-id pub-id-type="pii">hir.2024.30.1.73</pub-id>
          <pub-id pub-id-type="pmcid">PMC10879823</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shiren</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jiangnan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xinhua</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xinye</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Interpretable prediction model for assessing diabetes complication risks in Chinese sufferers</article-title>
          <source>Diabetes Res Clin Pract</source>
          <year>2024</year>
          <volume>209</volume>
          <fpage>111560</fpage>
          <pub-id pub-id-type="doi">10.1016/j.diabres.2024.111560</pub-id>
          <pub-id pub-id-type="medline">38316188</pub-id>
          <pub-id pub-id-type="pii">S0168-8227(24)00043-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Qiu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>An</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>A machine learning prediction model for cancer risk in patients with type 2 diabetes based on clinical tests</article-title>
          <source>Technol Health Care</source>
          <year>2024</year>
          <volume>32</volume>
          <issue>3</issue>
          <fpage>1431</fpage>
          <lpage>1443</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37781827"/>
          </comment>
          <pub-id pub-id-type="doi">10.3233/THC-230385</pub-id>
          <pub-id pub-id-type="medline">37781827</pub-id>
          <pub-id pub-id-type="pii">THC230385</pub-id>
          <pub-id pub-id-type="pmcid">PMC11091618</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Malaba</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kosiyo</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Guyah</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Haemoglobin types and variant interference with HbA1c and its association with uncontrolled HbA1c in type 2 diabetes mellitus</article-title>
          <source>BMC Res Notes</source>
          <year>2024</year>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>342</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcresnotes.biomedcentral.com/articles/10.1186/s13104-024-06982-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13104-024-06982-7</pub-id>
          <pub-id pub-id-type="medline">39574185</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13104-024-06982-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC11583738</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Antwi-Baffour</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mensah</surname>
              <given-names>BT</given-names>
            </name>
            <name name-style="western">
              <surname>Armah</surname>
              <given-names>DNO</given-names>
            </name>
            <name name-style="western">
              <surname>Ali-Mustapha</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Annison</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Comparative analysis of glycated haemoglobin, fasting blood glucose and haematological parameters in type-2 diabetes patients</article-title>
          <source>BMC Res Notes</source>
          <year>2023</year>
          <volume>16</volume>
          <issue>1</issue>
          <fpage>256</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcresnotes.biomedcentral.com/articles/10.1186/s13104-023-06520-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13104-023-06520-x</pub-id>
          <pub-id pub-id-type="medline">37798652</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13104-023-06520-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC10557280</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Mu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Remnant cholesterol, but not other traditional lipids or lipid ratios, is independently and positively related to future diabetes risk in Chinese general population: a 3 year cohort study</article-title>
          <source>J Diabetes Investig</source>
          <year>2024</year>
          <volume>15</volume>
          <issue>8</issue>
          <fpage>1084</fpage>
          <lpage>1093</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/doi/10.1111/jdi.14205"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/jdi.14205</pub-id>
          <pub-id pub-id-type="medline">38568177</pub-id>
          <pub-id pub-id-type="pmcid">PMC11292390</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zhen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Circulating bone morphogenetic protein-9 is decreased in patients with type 2 diabetes and non-alcoholic fatty liver disease</article-title>
          <source>Int J Gen Med</source>
          <year>2022</year>
          <volume>15</volume>
          <fpage>8539</fpage>
          <lpage>8546</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36514745"/>
          </comment>
          <pub-id pub-id-type="doi">10.2147/IJGM.S385513</pub-id>
          <pub-id pub-id-type="medline">36514745</pub-id>
          <pub-id pub-id-type="pii">385513</pub-id>
          <pub-id pub-id-type="pmcid">PMC9741848</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Visceral fat area and body fat percentage measured by bioelectrical impedance analysis correlate with glycometabolism</article-title>
          <source>BMC Endocr Disord</source>
          <year>2022</year>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>231</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcendocrdisord.biomedcentral.com/articles/10.1186/s12902-022-01142-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12902-022-01142-z</pub-id>
          <pub-id pub-id-type="medline">36109703</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12902-022-01142-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC9479287</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gollapalli</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Alansari</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alkhorasani</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Alsubaii</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sakloua</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Alzahrani</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Hariri</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Alfares</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>AlKhafaji</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Al Argan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Albaker</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>A novel stacking ensemble for detecting three types of diabetes mellitus using a Saudi Arabian dataset: pre-diabetes, T1DM, and T2DM</article-title>
          <source>Comput Biol Med</source>
          <year>2022</year>
          <volume>147</volume>
          <fpage>105757</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0010-4825(22)00531-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.compbiomed.2022.105757</pub-id>
          <pub-id pub-id-type="medline">35777087</pub-id>
          <pub-id pub-id-type="pii">S0010-4825(22)00531-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Keshavjee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Guergachi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Predictive models for diabetes mellitus using machine learning techniques</article-title>
          <source>BMC Endocr Disord</source>
          <year>2019</year>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>101</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcendocrdisord.biomedcentral.com/articles/10.1186/s12902-019-0436-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12902-019-0436-6</pub-id>
          <pub-id pub-id-type="medline">31615566</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12902-019-0436-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC6794897</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zuo</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for predicting the 3-year risk of incident diabetes in Chinese adults</article-title>
          <source>Front Public Health</source>
          <year>2021</year>
          <volume>9</volume>
          <fpage>626331</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34268283"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpubh.2021.626331</pub-id>
          <pub-id pub-id-type="medline">34268283</pub-id>
          <pub-id pub-id-type="pmcid">PMC8275929</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fernandes Silva</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hokkanen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Vangipurapu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Oravilahti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Laakso</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Metabolites as risk factors for diabetic retinopathy in patients with type 2 diabetes: a 12-year follow-up study</article-title>
          <source>J Clin Endocrinol Metab</source>
          <year>2023</year>
          <volume>109</volume>
          <issue>1</issue>
          <fpage>100</fpage>
          <lpage>106</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37560996"/>
          </comment>
          <pub-id pub-id-type="doi">10.1210/clinem/dgad452</pub-id>
          <pub-id pub-id-type="medline">37560996</pub-id>
          <pub-id pub-id-type="pii">7240444</pub-id>
          <pub-id pub-id-type="pmcid">PMC10735554</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lamichhane</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Agrawal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Abouainain</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Abousahle</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Regmi</surname>
              <given-names>PR</given-names>
            </name>
          </person-group>
          <article-title>Utility of neutrophil-to-high-density lipoprotein-cholesterol ratio in patients with coronary artery disease: a narrative review</article-title>
          <source>J Int Med Res</source>
          <year>2023</year>
          <volume>51</volume>
          <issue>4</issue>
          <fpage>3000605231166518</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/abs/10.1177/03000605231166518?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/03000605231166518</pub-id>
          <pub-id pub-id-type="medline">37038922</pub-id>
          <pub-id pub-id-type="pmcid">PMC10107976</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahn</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Yoon</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Hahn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Moon</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>YM</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of non-laboratory and laboratory prediction models for current and future diabetes mellitus: a cross-sectional and retrospective cohort study</article-title>
          <source>PLoS One</source>
          <year>2016</year>
          <volume>11</volume>
          <issue>5</issue>
          <fpage>e0156155</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0156155"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0156155</pub-id>
          <pub-id pub-id-type="medline">27214034</pub-id>
          <pub-id pub-id-type="pii">PONE-D-15-28825</pub-id>
          <pub-id pub-id-type="pmcid">PMC4877115</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yip</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Complications of diabetes in China: health system and economic implications</article-title>
          <source>BMC Public Health</source>
          <year>2019</year>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>269</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/s12889-019-6569-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12889-019-6569-8</pub-id>
          <pub-id pub-id-type="medline">30841928</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12889-019-6569-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC6414024</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Forbes</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ghazaleh</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Asaad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Duaso</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Interventions and behaviour change techniques for improving physical activity level in working-age people (18-60 years) with type 2 diabetes: a systematic review and network meta-analysis</article-title>
          <source>Int J Nurs Stud</source>
          <year>2024</year>
          <volume>160</volume>
          <fpage>104884</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0020-7489(24)00197-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijnurstu.2024.104884</pub-id>
          <pub-id pub-id-type="medline">39250878</pub-id>
          <pub-id pub-id-type="pii">S0020-7489(24)00197-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Nie</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>The prediction effect of HbA1c on nosocomial infection in diabetic patients was analyzed based on decision curve and dose response</article-title>
          <source>Altern Ther Health Med</source>
          <year>2024</year>
          <volume>30</volume>
          <issue>9</issue>
          <fpage>157</fpage>
          <lpage>161</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://alternative-therapies.com/oa/index.html?fid=9779"/>
          </comment>
          <pub-id pub-id-type="medline">38294751</pub-id>
          <pub-id pub-id-type="pii">AT9779</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kibirige</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zawedde-Muyanja</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Andia-Biraro</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Olum</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Adakun</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sekaggya-Wiltshire</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kimuli</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Diagnostic accuracy of two confirmatory tests for diabetes mellitus in adult Ugandans with recently diagnosed tuberculosis</article-title>
          <source>Ther Adv Infect Dis</source>
          <year>2023</year>
          <volume>10</volume>
          <fpage>20499361231216799</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/20499361231216799?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/20499361231216799</pub-id>
          <pub-id pub-id-type="medline">38145193</pub-id>
          <pub-id pub-id-type="pii">10.1177_20499361231216799</pub-id>
          <pub-id pub-id-type="pmcid">PMC10748612</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lv</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zha</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ke</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Detection of diabetic patients in people with normal fasting glucose using machine learning</article-title>
          <source>BMC Med</source>
          <year>2023</year>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>342</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedicine.biomedcentral.com/articles/10.1186/s12916-023-03045-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12916-023-03045-9</pub-id>
          <pub-id pub-id-type="medline">37674168</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12916-023-03045-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC10483877</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
