<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="systematic-review" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Endocrinol.</journal-id>
<journal-title>Frontiers in Endocrinology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Endocrinol.</abbrev-journal-title>
<issn pub-type="epub">1664-2392</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fendo.2025.1495306</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Endocrinology</subject>
<subj-group>
<subject>Systematic Review</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Machine learning-based risk predictive models for diabetic kidney disease in type 2 diabetes mellitus patients: a systematic review and meta-analysis</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Yihan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2750735"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Jin</surname>
<given-names>Nan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhan</surname>
<given-names>Qiuzhong</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Huang</surname>
<given-names>Yue</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Sun</surname>
<given-names>Aochuan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2361982"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yin</surname>
<given-names>Fen</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2528360"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Zhuangzhuang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2528124"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Hu</surname>
<given-names>Jiayu</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2799589"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Liu</surname>
<given-names>Zhengtang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2044875"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Geriatrics, Xiyuan Hospital, China Academy of Traditional Chinese Medicine</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Faculty of Chinese Medicine, Macau University of Science and Technology</institution>, <addr-line>Macao</addr-line>, &#xa0;<country>Macao SAR, China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Graduate School of Beijing University of Chinese Medicine</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Prasanna Santhanam, Johns Hopkins University, United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Andreas Leiherer, Vorarlberg Institute for Vascular Investigation and Treatment (VIVIT), Austria</p>
<p>Roshan Kumar Mahat, Dharanidhar Medical College and Hospital, India</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Zhengtang Liu, <email xlink:href="mailto:doctorzht@126.com">doctorzht@126.com</email>; Jiayu Hu, <email xlink:href="mailto:hujiayu2018@126.com">hujiayu2018@126.com</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>03</day>
<month>03</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1495306</elocation-id>
<history>
<date date-type="received">
<day>12</day>
<month>09</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>13</day>
<month>02</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Li, Jin, Zhan, Huang, Sun, Yin, Li, Hu and Liu</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Li, Jin, Zhan, Huang, Sun, Yin, Li, Hu and Liu</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Machine learning (ML) models are being increasingly employed to predict the risk of developing and progressing diabetic kidney disease (DKD) in patients with type 2 diabetes mellitus (T2DM). However, the performance of these models still varies, which limits their widespread adoption and practical application. Therefore, we conducted a systematic review and meta-analysis to summarize and evaluate the performance and clinical applicability of these risk predictive models and to identify key research gaps.</p>
</sec>
<sec>
<title>Methods</title>
<p>We conducted a systematic review and meta-analysis to compare the performance of ML predictive models. We searched PubMed, Embase, the Cochrane Library, and Web of Science for English-language studies using ML algorithms to predict the risk of DKD in patients with T2DM, covering the period from database inception to April 18, 2024. The primary performance metric for the models was the area under the receiver operating characteristic curve (AUC) with a 95% confidence interval (CI). The risk of bias was assessed using the Prediction Model Risk of Bias Assessment Tool (PROBAST) checklist.</p>
</sec>
<sec>
<title>Results</title>
<p>26 studies that met the eligibility criteria were included into the meta-analysis. 25 studies performed internal validation, but only 8 studies conducted external validation. A total of 94 ML models were developed, with 81 models evaluated in the internal validation sets and 13 in the external validation sets. The pooled AUC was 0.839 (95% CI 0.787-0.890) in the internal validation and 0.830 (95% CI 0.784-0.877) in the external validation sets. Subgroup analysis based on the type of ML showed that the pooled AUC for traditional regression ML was 0.797 (95% CI 0.777-0.816), for ML was 0.811 (95% CI 0.785-0.836), and for deep learning was 0.863 (95% CI 0.825-0.900). A total of 26 ML models were included, and the AUCs of models that were used three or more times were pooled. Among them, the random forest (RF) models demonstrated the best performance with a pooled AUC of 0.848 (95% CI 0.785-0.911).</p>
</sec>
<sec>
<title>Conclusion</title>
<p>This meta-analysis demonstrates that ML exhibit high performance in predicting DKD risk in T2DM patients. However, challenges related to data bias during model development and validation still need to be addressed. Future research should focus on enhancing data transparency and standardization, as well as validating these models&#x2019; generalizability through multicenter studies.</p>
</sec>
<sec>
<title>Systematic Review Registration</title>
<p>
<uri xlink:href="https://inplasy.com/inplasy-2024-9-0038/">https://inplasy.com/inplasy-2024-9-0038/</uri>, identifier INPLASY202490038.</p>
</sec>
</abstract>
<kwd-group>
<kwd>machine learning</kwd>
<kwd>predictive model</kwd>
<kwd>type 2 diabetes mellitus</kwd>
<kwd>diabetic kidney disease</kwd>
<kwd>meta-analysis</kwd>
<kwd>systematic review</kwd>
</kwd-group>
<contract-sponsor id="cn001">National Key Research and Development Program of China<named-content content-type="fundref-id">10.13039/501100012166</named-content>
</contract-sponsor>
<counts>
<fig-count count="3"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="85"/>
<page-count count="17"/>
<word-count count="8328"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Clinical Diabetes</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Diabetic kidney disease (DKD) is one of the major microvascular complications of type 2 diabetes mellitus (T2DM), characterized by both structural and functional renal impairment resulting from chronic hyperglycemia. The global incidence of T2DM has shown a marked increase, which has been paralleled by a rising prevalence of DKD (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B2">2</xref>). It is estimated that approximately 20% to 40% of individuals with diabetes will eventually develop DKD (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B3">3</xref>). DKD remains a leading cause of end-stage renal disease (ESRD) worldwide (<xref ref-type="bibr" rid="B4">4</xref>&#x2013;<xref ref-type="bibr" rid="B6">6</xref>). The presence and severity of DKD have been demonstrated to significantly elevate the risk of adverse health outcomes, including premature mortality, in patients with T2DM (<xref ref-type="bibr" rid="B7">7</xref>). This poses a substantial challenge to global public health. Consequently, the early identification of individuals at high risk for DKD is critical for implementing targeted interventions and improving clinical prognosis.</p>
<p>Conventional risk prediction models for DKD, such as linear regression, estimate risk by calculating a weighted sum of known risk factors (<xref ref-type="bibr" rid="B8">8</xref>&#x2013;<xref ref-type="bibr" rid="B10">10</xref>). While these models are effective when a limited number of variables or predictors are involved, they face significant limitations in capturing the complex nonlinear relationships and interactions among multidimensional risk factors (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B12">12</xref>). In contrast, ML methods that leverage big data or multidimensional datasets offer substantial promise in improving predictive accuracy (<xref ref-type="bibr" rid="B13">13</xref>). Recently, machine learning (ML) has demonstrated considerable advantages in the early detection and effective management of diseases (<xref ref-type="bibr" rid="B14">14</xref>&#x2013;<xref ref-type="bibr" rid="B18">18</xref>). On one hand, ML can efficiently process vast amounts of data at relatively low costs; on the other hand, it can analyze these datasets to generate hypotheses and uncover latent patterns. Specifically, ML techniques have the capacity to extract common features from diverse data sources, such as text, images, behavioral data, and physiological indicators, thereby unveiling the intricate relationships between DKD and various contributing factors (<xref ref-type="bibr" rid="B19">19</xref>).</p>
<p>DKD is clinically diagnosed based on the albuminuria and the estimation of glomerular filtration rate (eGFR). However, DKD often has an insidious onset, with many patients being diagnosed only after irreversible renal damage has already occurred (<xref ref-type="bibr" rid="B4">4</xref>, <xref ref-type="bibr" rid="B20">20</xref>). Recent studies have demonstrated that DKD is associated with a variety of metabolites, including those found in plasma, serum, urine, and mitochondria (<xref ref-type="bibr" rid="B21">21</xref>). Additionally, genetic variants linked to diabetes are frequently correlated with an increased risk of developing DKD (<xref ref-type="bibr" rid="B22">22</xref>). Retinal microvascular changes, such as retinopathy, vascular stenosis, dilation, and tortuosity, have also been shown to be associated with DKD (<xref ref-type="bibr" rid="B23">23</xref>). The potential of ML lies in its ability to integrate and analyze multidimensional data from diverse domains, including clinical, genetic, proteomic, metabolomic, and imaging information (<xref ref-type="bibr" rid="B24">24</xref>, <xref ref-type="bibr" rid="B25">25</xref>). This capability holds significant promise for enhancing the accuracy of DKD risk prediction. Previous studies have demonstrated the feasibility of employing ML techniques to utilize various date types for identifying and predicting the risk of DKD in T2DM patients (<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B27">27</xref>).</p>
<p>In summary, ML algorithms hold potential value in predicting DKD risk. However, considering the diversity of ML algorithms, the initial differences in dataset characteristics, and the variations in sample sizes, the heterogeneity among studies cannot be overlooked. Moreover, although ML has garnered significant attention within the medical field, its robustness in clinical practice remains uncertain, and its widespread adoption and application are somewhat constrained. Therefore, in this systematic review and meta-analysis, we aimed to comprehensively integrate and evaluate the performance and clinical applicability of published ML-based models for predicting the DKD risk in T2DM patients. And hope to provide more reliable reference for clinical practice.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Study design</title>
<p>This systematic review and meta-analysis were conducted in accordance with the guidelines recommended by the Cochrane Collaboration and the Preferred Reporting Items for Systematic Reviews and Meta-Analyses of Diagnostic Test Accuracy Studies (PRISMA-DTA) statement (<xref ref-type="bibr" rid="B28">28</xref>). The Checklist for Critical Appraisal and Data Extraction for Systematic Reviews of Prediction Modelling Studies (CHARMS) was employed to define the objectives of this systematic review and meta-analysis (<xref ref-type="bibr" rid="B29">29</xref>). The protocol for this systematic review and meta-analysis has been registered <italic>a priori</italic> at the International Platform of Registered Systematic Review and Meta-analysis Protocols (INPLASY) (<xref ref-type="bibr" rid="B30">30</xref>). (Registration: INPLASY202490038, <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.37766/inplasy2024.9.0038">https://doi.org/10.37766/inplasy2024.9.0038</ext-link>).</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Date sources and search strategy</title>
<p>We aimed to compile predictive models for the DKD risk in T2DM patients based on ML algorithms, with the goal of evaluating their performance. With the assistance of information specialists, we conducted a comprehensive search across the following databases: PubMed, Embase, Cochrane Library, and Web of Science Core Collection. We included all relevant English-language publications up to April 18, 2024. Both controlled vocabulary terms (MeSH terms in Embase and PubMed) and free-text terms were employed using Boolean operators. The detailed search strategy is outlined in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>.</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Inclusion criteria</title>
<p>We included studies that evaluated the predictive performance of ML algorithms in assessing the DKD risk in T2DM patients, focusing on those that met the &#x201c;PICOS&#x201d; inclusion criteria.</p>
<sec id="s2_3_1">
<label>2.3.1</label>
<title>Participants</title>
<p>The participants were diagnosed with T2DM (<xref ref-type="bibr" rid="B31">31</xref>), with no eligibility restrictions based on gender, age, ethnicity, or geographical location. Studies focusing on other types of diabetes were excluded from this review.</p>
</sec>
<sec id="s2_3_2">
<label>2.3.2</label>
<title>Intervention</title>
<p>Studies were included if they explicitly specified the application of clinical prediction models based on ML algorithms in T2DM patients. This included all relevant synonyms and methodologies related to ML, such as &#x201c;supervised machine learning&#x201d;, &#x201c;unsupervised machine learning&#x201d;, &#x201c;deep learning&#x201d;, &#x201c;neural networks&#x201d; and &#x201c;support vector machines&#x201d;. Consequently, studies that did not employ ML algorithms or those where ML was applied in nonclinical settings were excluded.</p>
</sec>
<sec id="s2_3_3">
<label>2.3.3</label>
<title>Comparators</title>
<p>We included studies that compared ML algorithms with other ML algorithms, traditional statistical analyses, clinical scoring tools, and manual diagnoses with or without clinical scoring tools. Studies that solely used traditional statistical prediction tools or relied exclusively on unaided clinical performance were excluded.</p>
</sec>
<sec id="s2_3_4">
<label>2.3.4</label>
<title>Outcomes</title>
<p>The primary outcome indicator is the risk of developing DKD in T2DM patients (<xref ref-type="bibr" rid="B1">1</xref>). Included studies must report model performance metrics, specifically area under the receiver operating characteristic curve (AUC).</p>
</sec>
<sec id="s2_3_5">
<label>2.3.5</label>
<title>Study</title>
<p>Cohort studies, case-cohort studies, case-control studies and nested case-control studies.</p>
</sec>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Exclusion criteria</title>
<p>We excluded studies in the form of review articles, meta-analysis, case reports, conference abstracts, guidelines, editorials, commentaries, expert opinions, letters, and animal studies. Additionally, studies employing simple algorithms instead of ML were excluded. We also excluded studies that merely analyzed influencing factors without constructing a ML risk mode. Furthermore, studies that used ML exclusively for image recognition without developing a predictive model were excluded. In case where multiple studies used the same or overlapping patient datasets, only the most recent study was included.</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Study selection</title>
<p>Firstly, the retrieved studies were imported into EndNote software for reference management where duplicate references were identified and removed. Secondly, two independent reviewers (Y.H. Li and N. Jin) performed a preliminary screening of the titles and abstracts of the included studies. This screening focused on selecting only those studies pertinent to the use of ML algorithms for risk prediction of DKD in T2DM patients. Note that two reviewers are required to independently evaluate the full research report and apply predefined inclusion and exclusion criteria to determine eligibility. Additionally, we manually searched the references of the included studies to identify any other potentially eligible studies. In cases of disagreement regarding the inclusion of a study during the screening process, consensus was achieved through discussion or by consulting a third independent reviewers (Q.Z. Zhan) for arbitration.</p>
</sec>
<sec id="s2_6">
<label>2.6</label>
<title>Date extraction</title>
<p>We employed the CHARMS checklist and the Transparent Reporting of a multivariable prediction model for Individual Prognosis or Diagnosis (TRIPOD) guidelines to develop standardized forms for data extraction (<xref ref-type="bibr" rid="B29">29</xref>, <xref ref-type="bibr" rid="B32">32</xref>). Two independent reviewers (Y.H. Li and N. Jin) extracted data from the studies that were ultimately included. Notably, during the extraction process, if a single study reported multiple performance outcomes for the same ML model, we selected the best result. Additionally, if a study included two or more models, we extracted performance metrics for each model. Specifically, the following information was extracted from each study: first author, year of publication, country, data source, study design, research objectives, sample size, participant characteristics, age, gender distribution, type of prediction, type of ML model, category of predictive factors, model development and validation processes, and model performance metrics. The primary performance metrics of the included models typically included the area under the AUC, C-statistic, sensitivity, specificity, accuracy, F1 score, positive predictive value (PPV), and negative predictive value (NPV). In our study, AUC and the associated 95% confidence intervals (CI) were primarily used as the key metrics for evaluating model performance. If necessary, we attempted to contact the study authors for additional detailed information.</p>
</sec>
<sec id="s2_7">
<label>2.7</label>
<title>Risk of bias assessment</title>
<p>We assessed the risk of bias in the prediction models using the Prediction Model Risk of Bias Assessment Tool (PROBAST) (<xref ref-type="bibr" rid="B33">33</xref>), which is specifically designed for studies involving multivariable prediction models for individual prognosis or diagnosis. This tool assesses four domains: participants, predictors, outcomes, and statistical analysis. Each domain includes 2 to 9 key questions, with responses categorized as &#x201c;Yes&#x201d;/&#x201d;Probably Yes&#x201d;, &#x201c;No&#x201d;/&#x201d;Probably No&#x201d;, or &#x201c;Unclear&#x201d;. If at least one question within a domain is rated as &#x201c;No&#x201d; or &#x201c;Probably No&#x201d; the domain is considered high risk. Conversely, if all questions are rated as &#x201c;Yes&#x201d; or &#x201c;Probably Yes&#x201d; the domain is deemed low risk. When all domains are assessed as low risk, the overall risk of bias is categorized as low. If at least one domain is considered high risk, the overall risk of bias is rated as high. If the assessment is uncertain, the overall risk is marked as unclear. Similarly, this section was evaluated by two independent reviewers (Y.H. Li and N. Jin), who cross-checked their results. In cases of disagreement, a third reviewer (Q.Z. Zhan) was consulted to make the final decision.</p>
</sec>
<sec id="s2_8">
<label>2.8</label>
<title>Statistical analysis</title>
<p>We conducted a meta-analysis, pooling the AUC values and their 95% CIs from individual studies, and performed stratified analyses based on study design, model type, and other relevant factors. If the AUC did not report a 95% CI or standard error (SE), we estimated the SE and 95% CI using the Hanley and McNeil formula (<xref ref-type="bibr" rid="B34">34</xref>&#x2013;<xref ref-type="bibr" rid="B36">36</xref>). Given the high heterogeneity among the included studies due to variations in study design, ML models, predictive factors, and parameters, we used the Der Simonian and Laird random-effects model to pool the AUCs in the meta-analysis (<xref ref-type="bibr" rid="B37">37</xref>). Additionally, we calculated the 95% prediction interval (PI) to characterize the degree of heterogeneity among studies and to assess the potential range of the predictive model&#x2019;s performance in future studies. The results were presented in the form of a forest plot. Moreover, we assessed the degree of heterogeneity between studies using the Cochrane Q test and <italic>I&#xb2;</italic> statistic to determine the suitability of a fixed-effects model (<italic>P</italic> &lt; 0.10 or <italic>I</italic>&#xb2; &gt; 25%) (<xref ref-type="bibr" rid="B38">38</xref>). It is important to note that when the 95% CI or PI of the pooled AUC includes 0.5, we consider there to be insufficient evidence to demonstrate statistically significant discriminatory ability of the prediction model for DKD occurrence in the populations included in the meta-analysis. AUC values were classified as follows: &lt;0.60 as inadequate, 0.60&#x2013;0.70 as moderate, 0.70&#x2013;0.80 as acceptable, and &gt;0.80 as excellent. All statistical analyses were conducted using STATA version 18. Statistical significance was defined as a <italic>P</italic>-value less than 0.05, with a threshold of 0.10 for heterogeneity testing.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Study selection</title>
<p>In this study, two independent reviewers (Y.H. Li and N. Jin) conducted a comprehensive screening and integration of the data. The inter-rater reliability was assessed using the Kappa coefficient, which indicated substantial agreement between the two reviewers (kappa = 0.82).</p>
<p>A total of 1260 studies were identified through a systematic search of the predetermined electronic databases, based on the established search strategy. Specifically, we retrieved 218 records from PubMed, 174 records from the Cochrane Library, 494 records from Web of Science, and 374 records from Embase. Additionally, we identified 9 studies through reference list reviews. Subsequently, after removing duplicates, 877 studies remained. We screened these studies by reviewing titles and abstracts, excluding 754 studies that either reported irrelevant topics or lacked predefined outcomes. The remaining 123 studies were further assessed through full-text review. Finally, 26 studies meeting the inclusion and exclusion criteria were included for meta-analysis (<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B39">39</xref>&#x2013;<xref ref-type="bibr" rid="B62">62</xref>). A flowchart of the study search and selection process is detailed in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>, and search information from each electronic database is provided in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Study search and selection flowchart. Flowchart according to the Preferred Reporting Items for Systematic Reviews and Meta-Analyses (PRISMA 2020). <italic>n</italic>= number of studies/records/reports.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-16-1495306-g001.tif"/>
</fig>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Study characteristics</title>
<p>Among the 26 studies included, 14 were from China (<xref ref-type="bibr" rid="B39">39</xref>&#x2013;<xref ref-type="bibr" rid="B41">41</xref>, <xref ref-type="bibr" rid="B43">43</xref>, <xref ref-type="bibr" rid="B48">48</xref>, <xref ref-type="bibr" rid="B49">49</xref>, <xref ref-type="bibr" rid="B51">51</xref>&#x2013;<xref ref-type="bibr" rid="B53">53</xref>, <xref ref-type="bibr" rid="B55">55</xref>, <xref ref-type="bibr" rid="B59">59</xref>, <xref ref-type="bibr" rid="B60">60</xref>), 4 from the United States (<xref ref-type="bibr" rid="B42">42</xref>, <xref ref-type="bibr" rid="B50">50</xref>, <xref ref-type="bibr" rid="B56">56</xref>, <xref ref-type="bibr" rid="B58">58</xref>), 3 from Singapore (<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B44">44</xref>, <xref ref-type="bibr" rid="B45">45</xref>), 3 from Iran (<xref ref-type="bibr" rid="B46">46</xref>, <xref ref-type="bibr" rid="B47">47</xref>, <xref ref-type="bibr" rid="B54">54</xref>), and 1 each from Italy (<xref ref-type="bibr" rid="B27">27</xref>) and Bangladesh (<xref ref-type="bibr" rid="B57">57</xref>). Only one study was published in 2013 (<xref ref-type="bibr" rid="B61">61</xref>), while the rest were published in the past five years. All studies were predominantly retrospective, comprising 14 cohort studies (<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B41">41</xref>, <xref ref-type="bibr" rid="B42">42</xref>, <xref ref-type="bibr" rid="B46">46</xref>, <xref ref-type="bibr" rid="B48">48</xref>&#x2013;<xref ref-type="bibr" rid="B52">52</xref>, <xref ref-type="bibr" rid="B55">55</xref>, <xref ref-type="bibr" rid="B56">56</xref>, <xref ref-type="bibr" rid="B58">58</xref>, <xref ref-type="bibr" rid="B61">61</xref>, <xref ref-type="bibr" rid="B62">62</xref>), 9 cross-sectional studies (<xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B40">40</xref>, <xref ref-type="bibr" rid="B45">45</xref>, <xref ref-type="bibr" rid="B47">47</xref>, <xref ref-type="bibr" rid="B53">53</xref>, <xref ref-type="bibr" rid="B54">54</xref>, <xref ref-type="bibr" rid="B57">57</xref>, <xref ref-type="bibr" rid="B59">59</xref>, <xref ref-type="bibr" rid="B60">60</xref>), and 3 case-control studies (<xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B43">43</xref>, <xref ref-type="bibr" rid="B44">44</xref>). The basic characteristics of each study are detailed in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Characteristics of studies included in the systematic review and meta-analysis.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Study</th>
<th valign="middle" align="center">Country</th>
<th valign="middle" align="center">Study Type</th>
<th valign="middle" align="center">model</th>
<th valign="middle" align="center">Sample Size</th>
<th valign="middle" align="center">Male/<break/>Female</th>
<th valign="middle" align="center">Age</th>
<th valign="middle" align="center">Predictors</th>
<th valign="middle" align="center">Machine Learning</th>
<th valign="middle" align="center">Performance Evaluation</th>
<th valign="middle" align="center">Validation</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Zhao et&#xa0;al. (2023) (<xref ref-type="bibr" rid="B39">39</xref>)</td>
<td valign="top" align="center">China</td>
<td valign="top" align="center">Cross</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Total: 678<break/>Training:202<break/>Internal validation:87<break/>External validation:389</td>
<td valign="top" align="center">467/211</td>
<td valign="top" align="center">54.1 &#xb1; 11.8</td>
<td valign="top" align="center">MH+LE</td>
<td valign="top" align="center">LR</td>
<td valign="top" align="center">AUC, Accuracy, Sensitivity, Jordan index</td>
<td valign="top" align="center">INV+EXV</td>
</tr>
<tr>
<td valign="top" align="left">Liu et&#xa0;al. (2020) (<xref ref-type="bibr" rid="B40">40</xref>)</td>
<td valign="top" align="center">China</td>
<td valign="top" align="center">Cross</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Total: 1485(10-fold cross)<break/>Training:<break/>Internal validation:</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">DC+LE+CI</td>
<td valign="top" align="center">BN, BN-wopi, NB, RF, DT</td>
<td valign="top" align="center">AUC, Sensitivity, Specificity</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Hui et&#xa0;al. (2023) (<xref ref-type="bibr" rid="B41">41</xref>)</td>
<td valign="top" align="center">China</td>
<td valign="top" align="center">Cohort</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Training:241</td>
<td valign="top" align="center">100/141</td>
<td valign="top" align="center">52.57 &#xb1; 10.65</td>
<td valign="top" align="center">MH+LE</td>
<td valign="top" align="center">LASSO</td>
<td valign="top" align="center">AUC, Precision score, Recall score, Accuracy</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Momenzadeh et&#xa0;al. (2022) (<xref ref-type="bibr" rid="B42">42</xref>)</td>
<td valign="top" align="center">USA</td>
<td valign="top" align="center">Cohort</td>
<td valign="top" align="center">PR</td>
<td valign="top" align="center">Total: 10468<break/>Training:8388<break/>Internal validation: 2097</td>
<td valign="top" align="center">5067/5401</td>
<td valign="top" align="center">57.7(48.3-68.3)</td>
<td valign="top" align="center">DC+LE+SH</td>
<td valign="top" align="center">SVC, GBDT, ET, AdaBoost, RF, LR</td>
<td valign="top" align="center">AUC</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Cai et&#xa0;al. (2024) (<xref ref-type="bibr" rid="B43">43</xref>)</td>
<td valign="top" align="center">China</td>
<td valign="top" align="center">Case</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Total: 210<break/>Training:147<break/>Internal validation:63</td>
<td valign="top" align="center">87/123</td>
<td valign="top" align="center">57.42 &#xb1; 8.15</td>
<td valign="top" align="center">MH+LE+CI</td>
<td valign="top" align="center">DT, RF</td>
<td valign="top" align="center">AUC, sensitivity, specificity, accuracy, recall, precision</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Betzler et&#xa0;al. (2023) (<xref ref-type="bibr" rid="B44">44</xref>)</td>
<td valign="top" align="center">Singapore</td>
<td valign="top" align="center">Case</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Training:13284(5-fold cross)<break/>Internal validation (5-fold cross); External validation: SEED:1969; SMART2D:712</td>
<td valign="top" align="center">6758/6526<break/>1047/922<break/>380/332</td>
<td valign="top" align="center">64.1 &#xb1; 10.8<break/>64.0 &#xb1; 9.2<break/>57.4 &#xb1; 10.7</td>
<td valign="top" align="center">DC+MH+LE+RP</td>
<td valign="top" align="center">DL</td>
<td valign="top" align="center">AUC, sensitivity, specificity, PPV, NPV</td>
<td valign="top" align="center">INV+EXV</td>
</tr>
<tr>
<td valign="top" align="left">He et&#xa0;al. (2024) (<xref ref-type="bibr" rid="B45">45</xref>)</td>
<td valign="top" align="center">Singapore</td>
<td valign="top" align="center">Cross</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Total: 2772(5-fold cross)<break/>Training:2219<break/>Internal validation:553<break/>External validation:5843</td>
<td valign="top" align="center">1411/1361<break/>3753/2090</td>
<td valign="top" align="center">61.7(53.5-69.4)<break/>61.0(55.0-65.0)</td>
<td valign="top" align="center">DC+MH+DD+PD+SH+LE</td>
<td valign="top" align="center">LASSO, GBDT, LR</td>
<td valign="top" align="center">AUC, sensitivity, specificity</td>
<td valign="top" align="center">INV+EXV</td>
</tr>
<tr>
<td valign="top" align="left">Hosseini Sarkhosh et&#xa0;al. (2023) (<xref ref-type="bibr" rid="B46">46</xref>)</td>
<td valign="top" align="center">Iran</td>
<td valign="top" align="center">Cohort</td>
<td valign="top" align="center">PR</td>
<td valign="top" align="center">Total: 1907<break/>Training:1526<break/>Internal validation:381<break/>External validation:1543</td>
<td valign="top" align="center">854/1053<break/>683/860</td>
<td valign="top" align="center">58.4 &#xb1; 9.4<break/>58.63 &#xb1; 9.24</td>
<td valign="top" align="center">DD+MH+CI</td>
<td valign="top" align="center">LR</td>
<td valign="top" align="center">AUC, accuracy, precision, f1score</td>
<td valign="top" align="center">INV+EXV</td>
</tr>
<tr>
<td valign="top" align="left">Afrash et&#xa0;al. (2022) (<xref ref-type="bibr" rid="B47">47</xref>)</td>
<td valign="top" align="center">Iran</td>
<td valign="top" align="center">Cross</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Total: 327 (5-fold cross)<break/>Training:<break/>Internal validation:</td>
<td valign="top" align="center">176/151</td>
<td valign="top" align="center">54.7 &#xb1; 3.8<break/>68.23 &#xb1; 5.6</td>
<td valign="top" align="center">DC+DD+LE+PE</td>
<td valign="top" align="center">DT</td>
<td valign="top" align="center">sensitivity, spec-ificity, accuracy</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Yang et&#xa0;al. (2024) (<xref ref-type="bibr" rid="B48">48</xref>)</td>
<td valign="top" align="center">China</td>
<td valign="top" align="center">Cohort</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Total: 162<break/>Training: 114<break/>Internal validation: 49</td>
<td valign="top" align="center">100/63</td>
<td valign="top" align="center">58 &#xb1; 12</td>
<td valign="top" align="center">RS</td>
<td valign="top" align="center">DL</td>
<td valign="top" align="center">ROC, accuracy, specificity, sensitivity, PPV, NPV</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Yin et&#xa0;al. (2024) (<xref ref-type="bibr" rid="B49">49</xref>)</td>
<td valign="top" align="center">China</td>
<td valign="top" align="center">Cohort</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Total: 562 (10-fold cross)<break/>Training: 9 subsets<break/>Internal validation: 1 subset</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">MH+DD+PD+PE+LE</td>
<td valign="top" align="center">XGB, RF, DT, LR</td>
<td valign="top" align="center">AUC-ROC, Accuracy</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Song et&#xa0;al. (2020) (<xref ref-type="bibr" rid="B50">50</xref>)</td>
<td valign="top" align="center">USA</td>
<td valign="top" align="center">Cohort</td>
<td valign="top" align="center">PR</td>
<td valign="top" align="center">Total: 14039<break/>Training: 11231<break/>Internal validation: 2808</td>
<td valign="top" align="center">6786/7253</td>
<td valign="top" align="center">58 &#xb1; 18</td>
<td valign="top" align="center">DC+LE+PE+RS+SH</td>
<td valign="top" align="center">GBM</td>
<td valign="top" align="center">AUROC, AUPRC</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Fan et&#xa0;al. (2021) (<xref ref-type="bibr" rid="B51">51</xref>)</td>
<td valign="top" align="center">China</td>
<td valign="top" align="center">Cohort</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Total: 165<break/>Training: 132<break/>Internal validation:33</td>
<td valign="top" align="center">97/68</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">DC+MH+FH+DD+PD</td>
<td valign="top" align="center">BN, CHAID, D, XF</td>
<td valign="top" align="center">AUC, NPV, PPV, accuracy.</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Zhang et&#xa0;al. (2022) (<xref ref-type="bibr" rid="B52">52</xref>)</td>
<td valign="top" align="center">China</td>
<td valign="top" align="center">Cohort</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Total: 929(5-fold cross)<break/>Training: 743<break/>Internal validation:186<break/>External validation:329</td>
<td valign="top" align="center">608/321<break/>234/94</td>
<td valign="top" align="center">51.34 &#xb1; 10.02<break/>51.83 &#xb1; 9.66</td>
<td valign="top" align="center">DD+CI+LE+FH</td>
<td valign="top" align="center">RF, SVM</td>
<td valign="top" align="center">AUC, Accuracy, Sensitivity, Specificity, PPV, NPV, Balanced accuracy</td>
<td valign="top" align="center">INV+EXV</td>
</tr>
<tr>
<td valign="top" align="left">Liu et&#xa0;al. (2023) (<xref ref-type="bibr" rid="B53">53</xref>)</td>
<td valign="top" align="center">China</td>
<td valign="top" align="center">Cross</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Total: 3624<break/>Training: 2899<break/>Internal validation:725</td>
<td valign="top" align="center">2034/1590</td>
<td valign="top" align="center">59 &#xb1; 9.0</td>
<td valign="top" align="center">DC+SH+PE+LE</td>
<td valign="top" align="center">CatBoost, GBM, XGBoost, ET, GBDT, RF, LDA, LR, QDA, AdaBoost, NB, KNN, DT, SVM, RC</td>
<td valign="top" align="center">AUC, Accuracy</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Hosseini Sarkhosh et&#xa0;al. (2022) (<xref ref-type="bibr" rid="B54">54</xref>)</td>
<td valign="top" align="center">Iran</td>
<td valign="top" align="center">Cross</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Total: 6235<break/>Training: 4988<break/>Internal validation:1247</td>
<td valign="top" align="center">2754/3481</td>
<td valign="top" align="center">57.6 &#xb1; 11.9</td>
<td valign="top" align="center">DC+DD+LE+PE+CI</td>
<td valign="top" align="center">DT, SVM, LR, RF, XGBoost</td>
<td valign="top" align="center">AUC</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Dong et&#xa0;al. (2022) (<xref ref-type="bibr" rid="B55">55</xref>)</td>
<td valign="top" align="center">China</td>
<td valign="top" align="center">Cohort</td>
<td valign="top" align="center">PR</td>
<td valign="top" align="center">Total: 2809<break/>Training: 652<break/>Internal validation:164</td>
<td valign="top" align="center">585/231</td>
<td valign="top" align="center">56(48.3-65.0)</td>
<td valign="top" align="center">DC+LE+PE</td>
<td valign="top" align="center">GBM, XGBoost, AdaBoost, ANN, DT, SVM, LR</td>
<td valign="top" align="center">AUC, sensitivity, specificity, accuracy, F1</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Nicolucci et&#xa0;al. (2022) (<xref ref-type="bibr" rid="B27">27</xref>)</td>
<td valign="top" align="center">Italy</td>
<td valign="top" align="center">Case</td>
<td valign="top" align="center">PR</td>
<td valign="top" align="center">Total: 147664(Ten-fold Cross)<break/>Training: nine folds<break/>Internal validation: one fold</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">XGBoost</td>
<td valign="top" align="center">AUC, accuracy, sensitivity, specificity</td>
<td valign="top" align="center">INV+EXV</td>
</tr>
<tr>
<td valign="top" align="left">Sabanayagam et&#xa0;al. (2023) (<xref ref-type="bibr" rid="B26">26</xref>)</td>
<td valign="top" align="center">Singapore</td>
<td valign="top" align="center">Cohort</td>
<td valign="top" align="center">PR</td>
<td valign="top" align="center">Total: 1365<break/>Training: 652<break/>Internal validation:164</td>
<td valign="top" align="center">698/667</td>
<td valign="top" align="center">58.74 &#xb1; 8.95</td>
<td valign="top" align="center">DC+MH+PD+CI+LE+PE</td>
<td valign="top" align="center">LASSO, EN, GBDT</td>
<td valign="top" align="center">AUC</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Allen et&#xa0;al. (2022) (<xref ref-type="bibr" rid="B56">56</xref>)</td>
<td valign="top" align="center">USA</td>
<td valign="top" align="center">Cohort</td>
<td valign="top" align="center">PR</td>
<td valign="top" align="center">Total: 87963<break/>Training: 62994<break/>Internal validation:17323<break/>Hold-out testing sets: 7656<break/>External validation: 23073</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">DC+MH+LE+SH+FH</td>
<td valign="top" align="center">RF, XGBoost</td>
<td valign="top" align="center">AUC, Sensitivity Specificity<break/>Positive and negative likelihood ratios, DOR</td>
<td valign="top" align="center">INV+EXV</td>
</tr>
<tr>
<td valign="top" align="left">Maniruzzaman et&#xa0;al. (2021) (<xref ref-type="bibr" rid="B57">57</xref>)</td>
<td valign="top" align="center">Bangladesh</td>
<td valign="top" align="center">Cross</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Training:133</td>
<td valign="top" align="center">55/78</td>
<td valign="top" align="center">54.3 &#xb1; 12.5</td>
<td valign="top" align="center">DC+DD+LE+PE</td>
<td valign="top" align="center">LDA, SVM-RBF, LR, KNN, NB</td>
<td valign="top" align="center">AUC, sensitivity, specificity, accuracy, F1</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Song et&#xa0;al. (2019) (<xref ref-type="bibr" rid="B58">58</xref>)</td>
<td valign="top" align="center">USA</td>
<td valign="top" align="center">Cohort</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Total: 15645<break/>Training: 8089<break/>Internal validation: 3461<break/>External validation: 4086</td>
<td valign="top" align="center">7726/7919</td>
<td valign="top" align="center">59.0 &#xb1; 14.0</td>
<td valign="top" align="center">DC+DD+LE+PE+CI</td>
<td valign="top" align="center">GBM</td>
<td valign="top" align="center">AUC, sensitivity, specificity, accuracy, F1</td>
<td valign="top" align="center">INV+EXV</td>
</tr>
<tr>
<td valign="top" align="left">Wang et&#xa0;al. (2021) (<xref ref-type="bibr" rid="B59">59</xref>)</td>
<td valign="top" align="center">China</td>
<td valign="top" align="center">Cross</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Training:2163</td>
<td valign="top" align="center">1227/949</td>
<td valign="top" align="center">57.27 &#xb1; 11.93</td>
<td valign="top" align="center">DC+MH+DD+SH+PE</td>
<td valign="top" align="center">LR</td>
<td valign="top" align="center">AUC</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Shi et&#xa0;al. (2023) (<xref ref-type="bibr" rid="B60">60</xref>)</td>
<td valign="top" align="center">China</td>
<td valign="top" align="center">Cross</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Total: 512<break/>Training: 360<break/>Internal validation:155</td>
<td valign="top" align="center">329/186</td>
<td valign="top" align="center">54.1 &#xb1; 0.64</td>
<td valign="top" align="center">DC+MH+DD+LE+PE</td>
<td valign="top" align="center">RF, SVM, GBDT, Adaboost</td>
<td valign="top" align="center">AUC</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Leung et&#xa0;al. (2013) (<xref ref-type="bibr" rid="B61">61</xref>)</td>
<td valign="top" align="center">China</td>
<td valign="top" align="center">Cohort</td>
<td valign="top" align="center">PR</td>
<td valign="top" align="center">Total: 673<break/>Training: 360<break/>Internal validation:155</td>
<td valign="top" align="center">277/396</td>
<td valign="top" align="center">57 &#xb1; 8.5</td>
<td valign="top" align="center">DC+DD+LE+PE+GA</td>
<td valign="top" align="center">SVM, Cforest</td>
<td valign="top" align="center">AUC, sensitivity, specificity, accuracy, F1</td>
<td valign="top" align="center">INV</td>
</tr>
<tr>
<td valign="top" align="left">Su et&#xa0;al. (2023) (<xref ref-type="bibr" rid="B62">62</xref>)</td>
<td valign="top" align="center">China</td>
<td valign="top" align="center">Cohort</td>
<td valign="top" align="center">DI</td>
<td valign="top" align="center">Total: 219<break/>Training: 175<break/>Internal validation:44</td>
<td valign="top" align="center">140/79</td>
<td valign="top" align="center">56.15 &#xb1; 10.98</td>
<td valign="top" align="center">DC+LE</td>
<td valign="top" align="center">KNN, SVM, LR</td>
<td valign="top" align="center">sensitivity, specificity, accuracy, F1, MCC, AUC</td>
<td valign="top" align="center">INV</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Cross, cross-sectional study; Cohort, Cohort Study; Case, Case-Control Study; DI, diagnostic model; PR, prognostic model; MH, medical history; LE, laboratory examinations; DC, demographic characteristics; CI, complications information; SH, social-lifestyle history; RP, Retinal Photographs; DD, Diabetes duration; PD, previous drug used; PE, Physical Examination; RS, Radiomic Signatures; FH, family history; GA, genetic attributes; CM, circulating metabolites; RH, renal histopathological results; LR, logistic regression; RF, random forest; DT, decision tree; SVM, support vector machine; GBDT, gradient boosted decision trees; BN, Bayesian networks; NB, Naive Bayes; AdaBoost, Adaptive Boosting; LASSO, Least Absolute Shrinkage and Selection Operator; MICE, Multivariate Imputation by Chained Equations; RFECV, Recursive Feature Elimination with Cross-Validation; GA, Genetic Algorithm; PCA, Principal Component Analysis; XGBoost, Extreme Gradient Boosting; KNN, K-Nearest Neighbors; AUC, area under the receiver operating characteristic curve; INV, Internal validation; EXV, External validation.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>Most of the data were obtained from electronic health record systems (EHRs) in hospitals, with a smaller proportion sourced from specialized disease research public databases, such as the Singapore Eye Disease Epidemiology Study Database and the Diabetic Retinopathy Comprehensive Project (<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B44">44</xref>, <xref ref-type="bibr" rid="B45">45</xref>, <xref ref-type="bibr" rid="B54">54</xref>). The included variables typically encompass demographic information (e.g., gender, age), disease characteristics (e.g., medical history, disease duration, complications), lifestyle factors (e.g., smoking, alcohol consumption), physical examination measures (e.g., height, weight), and clinical laboratory test results (e.g., blood and urine analysis). Additionally, some studies incorporated circulating metabolites (<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B45">45</xref>) and genetic parameters (<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B56">56</xref>) as variables. Furthermore, some studies used unstructured data, such as renal pathology images (<xref ref-type="bibr" rid="B39">39</xref>), retinal color fundus photographs (<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B44">44</xref>, <xref ref-type="bibr" rid="B60">60</xref>), and renal ultrasound images (<xref ref-type="bibr" rid="B48">48</xref>).</p>
<p>Regarding the types of predictive models, 18 studies focused on diagnostic models (<xref ref-type="bibr" rid="B39">39</xref>&#x2013;<xref ref-type="bibr" rid="B41">41</xref>, <xref ref-type="bibr" rid="B43">43</xref>&#x2013;<xref ref-type="bibr" rid="B45">45</xref>, <xref ref-type="bibr" rid="B47">47</xref>&#x2013;<xref ref-type="bibr" rid="B49">49</xref>, <xref ref-type="bibr" rid="B51">51</xref>&#x2013;<xref ref-type="bibr" rid="B54">54</xref>, <xref ref-type="bibr" rid="B57">57</xref>&#x2013;<xref ref-type="bibr" rid="B60">60</xref>, <xref ref-type="bibr" rid="B62">62</xref>), while the remaining 8 were prognostic models (<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B42">42</xref>, <xref ref-type="bibr" rid="B46">46</xref>, <xref ref-type="bibr" rid="B50">50</xref>, <xref ref-type="bibr" rid="B55">55</xref>, <xref ref-type="bibr" rid="B56">56</xref>, <xref ref-type="bibr" rid="B61">61</xref>). Among the prognostic models, the study by Leung et&#xa0;al. (<xref ref-type="bibr" rid="B61">61</xref>) had the longest median follow-up period of 7.8 years, whereas the study by Song et&#xa0;al. (<xref ref-type="bibr" rid="B50">50</xref>) had a follow-up period of only 1 year.</p>
<p>Twenty-five studies conducted internal validation, using either holdout validation sets or K-fold cross-validation. The total sample size across all internal validation was 319,190 participants. However, there was substantial variation in sample sizes among the studies, with Nicolucci et&#xa0;al. (<xref ref-type="bibr" rid="B27">27</xref>) having the largest sample size of 147,664, and Maniruzzaman et&#xa0;al. (<xref ref-type="bibr" rid="B57">57</xref>) having the smallest with 133. External validation was performed in 8 studies (<xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B44">44</xref>&#x2013;<xref ref-type="bibr" rid="B46">46</xref>, <xref ref-type="bibr" rid="B52">52</xref>, <xref ref-type="bibr" rid="B56">56</xref>, <xref ref-type="bibr" rid="B58">58</xref>). 4 studies employed external validation using datasets independent of the training set (<xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B44">44</xref>, <xref ref-type="bibr" rid="B45">45</xref>). 3 studies used a temporal split method, dividing data chronologically into training and external validation sets, with earlier data used for training and later data for external validation (<xref ref-type="bibr" rid="B46">46</xref>, <xref ref-type="bibr" rid="B52">52</xref>, <xref ref-type="bibr" rid="B58">58</xref>). For instance, Hosseini Sarkhosh et&#xa0;al. (<xref ref-type="bibr" rid="B46">46</xref>) used data from 2012-2016 as the training set and data from 2017-2021 as the external validation set. Additionally, while the internal and external validation sets in the study by Allen et&#xa0;al. (<xref ref-type="bibr" rid="B56">56</xref>) were derived from the same large dataset, the external validation set consisted solely of clinical data, which was independent of the training set. 7 of those external validation had a combined external validation sample size of 37,944. One study conducted external validation across 5 different centers (<xref ref-type="bibr" rid="B27">27</xref>), with reported cohort sizes ranging from 3,912 to 200,007, though specific sample sizes for the other centers were not provided.</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>ML models and performance evaluation</title>
<p>There were 26 ML models involved across 26 studies. The most commonly applied ML algorithms included logistic regression (LR, <italic>n</italic> = 11), random forest (RF, <italic>n</italic> = 9), decision tree (DT, <italic>n</italic> = 9), support vector machine (SVM, <italic>n</italic> = 6), gradient boosted decision trees (GBDT, <italic>n</italic> = 5), Bayesian networks (BN, <italic>n</italic> = 3), Naive Bayes (NB, <italic>n</italic> = 3), Adaptive Boosting (AdaBoost, <italic>n</italic> = 3), and Least Absolute Shrinkage and Selection Operator (LASSO, <italic>n</italic> = 3). All studies used classical methods to assess the discriminative ability of ML models. We used AUC and associated 95% CI as the primary ability metrics. Additionally, other ability evaluation metrics included Accuracy, Specificity, Sensitivity, Jordan index, Precision score, Recall score, PPV, and NPV, and F1 score.</p>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Handling of missing data</title>
<p>Most studies addressed missing data using various imputation methods. Among them, six studies used mean or median imputation (<xref ref-type="bibr" rid="B45">45</xref>, <xref ref-type="bibr" rid="B46">46</xref>, <xref ref-type="bibr" rid="B52">52</xref>, <xref ref-type="bibr" rid="B54">54</xref>, <xref ref-type="bibr" rid="B56">56</xref>, <xref ref-type="bibr" rid="B61">61</xref>). Momenzadeh et&#xa0;al. (<xref ref-type="bibr" rid="B42">42</xref>) applied the MissForest imputation method, while Liu et&#xa0;al. (<xref ref-type="bibr" rid="B40">40</xref>) employed the Multivariate Imputation by Chained Equations (MICE) algorithm. Additionally, 2 studies used ML algorithms for imputation (<xref ref-type="bibr" rid="B55">55</xref>, <xref ref-type="bibr" rid="B60">60</xref>). However, 3 studies only mentioned the use of imputation without specifying the exact methods employed (<xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B50">50</xref>, <xref ref-type="bibr" rid="B53">53</xref>). Three studies excluded missing data directly (<xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B44">44</xref>, <xref ref-type="bibr" rid="B48">48</xref>), while 6 studies selectively excluded missing data based on a certain proportion (<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B41">41</xref>, <xref ref-type="bibr" rid="B47">47</xref>, <xref ref-type="bibr" rid="B49">49</xref>, <xref ref-type="bibr" rid="B51">51</xref>, <xref ref-type="bibr" rid="B58">58</xref>). There were also 3 studies that did not mention their method to handling missing data (<xref ref-type="bibr" rid="B57">57</xref>, <xref ref-type="bibr" rid="B59">59</xref>, <xref ref-type="bibr" rid="B62">62</xref>). Furthermore, one prospective study had no missing data, and thus, did not involve any imputation methods (<xref ref-type="bibr" rid="B43">43</xref>).</p>
</sec>
<sec id="s3_5">
<label>3.5</label>
<title>Methods of selecting predictors</title>
<p>Of the studies reviewed, two did not mention the method used for predictor selection (<xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B44">44</xref>), one used all available features as predictors (<xref ref-type="bibr" rid="B42">42</xref>), and another determined predictors based on existing literature and expert consensus (<xref ref-type="bibr" rid="B56">56</xref>). The remaining 22 studies detailed their methods for predictors selection. The most frequently employed method was Recursive Feature Elimination with Cross-Validation (RFECV), followed by the LASSO. Additionally, some studies used multivariate LR, the Markov Blanket, the Genetic Algorithm (GA) feature selection method, and various ML algorithms, including RF, GBDT, Gradient Boosting Machine (GBM), SVM, DT, Extreme Gradient Boosting (XGBoost), and Principal Component Analysis (PCA) et&#xa0;al. for selecting predictors.</p>
</sec>
<sec id="s3_6">
<label>3.6</label>
<title>Quality of evidence and risk of bias</title>
<p>All included studies were assessed for risk of bias using the PROBAST tool. Overall, with the exception of two studies that were assessed as low risk and one study that was assessed as unclear risk, the remaining studies were assessed as having a high risk of bias. In domain 4 (statistical analysis), a significant proportion of studies had a high risk of bias. In particular, 14 studies failed to properly assess the discrimination and calibration of the prediction models, which is a common source of bias. Furthermore, 53.8% of the studies did not assess whether the coefficients and intercepts of the final predictors in the development phase were consistent with the results reported in the multivariable analysis, another common bias. Although the vast majority of studies (96.1%) conducted internal validation, a portion of these studies (34.6%) relied solely on random data splitting as internal validation, which cannot be considered a proper application of internal validation methods. This leading to an increased risk of bias. Eleven studies (42.3%) did not provide adequate explanations for handling complex data. Eight studies (30.8%) failed to appropriately address missing data in their included subjects. Additionally, 8 studies (30.8%) had unreasonable sample size designs, with 4 studies having an event-per-variable (EPV) ratio of less than 10 during the development of predictive models, and another 4 studies having a validation cohort sample size of fewer than 100 cases. These results indicate that potential bias may be present in the majority of the included studies, which should be considered carefully when interpreting the results. A summary table of the results from the PROBAST assessment can be seen in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;2</bold>
</xref>.</p>
</sec>
<sec id="s3_7">
<label>3.7</label>
<title>Statistical analysis</title>
<p>Twenty-five studies underwent internal validation, while only 8 studies performed external validation (<xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B44">44</xref>&#x2013;<xref ref-type="bibr" rid="B46">46</xref>, <xref ref-type="bibr" rid="B52">52</xref>, <xref ref-type="bibr" rid="B56">56</xref>, <xref ref-type="bibr" rid="B58">58</xref>). A total of 94 ML models were developed, with 81 models in the internal validation set and 13 models in the external validation set. The meta-analysis of the AUC included data from 25 studies for internal validation sets and 8 studies for external validation sets. Since most studies employed multiple ML models, we first pooled their AUC, as shown in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;3</bold>
</xref>.&#xa0;A meta-analysis was then subsequently performed using the pooled AUC from each study. The pooled AUC in the internal set was 0.839 (95% CI 0.787-0.890; <italic>I</italic>&#xb2;= 99.8%; <italic>P</italic> = 0.000 for heterogeneity), with a 95% PI ranging from 0.56 to 1.00. In contrast, the pooled AUC in the external validation set was 0.830 (95% CI 0.784-0.877; <italic>I</italic>&#xb2;= 95.6%; <italic>P</italic> = 0.000 for heterogeneity), with a narrower 95% PI of 0.64-0.97 that excluded 1, indicating more stable performance and better generalizability across external datasets, despite significant heterogeneity. Moreover, these results indicated a marginally higher pooled AUC in the internal validation set compared to the external validation set. The results of the meta-analysis were presented in <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Random effects forest plot of area under the curve (AUC) values with 95% confidence intervals (CI) in internal and external validation. AUC, area under the receiver operator characteristic curve. The weight % represents the contribution of each study to the overall analysis. The diamond shapes indicate pooled AUC estimates for each subgroup (internal, external) and the overall analysis. Horizontal lines represent the confidence intervals for individual studies, and the dashed vertical line indicates the pooled AUC estimate. p values from Cochran&#x2019;s Q test.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-16-1495306-g002.tif"/>
</fig>
<p>To identify potential sources of heterogeneity, we conducted subgroup analyses based on study type and prediction model type using the internal validation datasets. Individually, the pooled AUC for cross-sectional studies was 0.848 (95% CI 0.770-0.926; <italic>I</italic>&#xb2;= 99.2%; <italic>P</italic> = 0.000 for heterogeneity), for cohort studies it was 0.833 (95% CI 0.775-0.891; <italic>I</italic>&#xb2;= 99.5%; <italic>P</italic> = 0.000 for heterogeneity). Notably, case-control demonstrated a pooled AUC of 0.858 (95% CI 0.817-0.900) with significantly reduced heterogeneity (<italic>I</italic>&#xb2; = 23.0%; <italic>P</italic> = 0.254). When grouped by prediction model type, pooled AUC was 0.797 (95% CI 0.757-0.836; <italic>I</italic>&#xb2;= 97.7%; <italic>P</italic> = 0.000 for heterogeneity) for prognostic models and 0.856 (95% CI 0.815-0.896; <italic>I</italic>&#xb2;= 99.5%; <italic>P</italic> = 0.000 for heterogeneity) for diagnostic models. The results of the meta-analysis were presented in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;1</bold>
</xref>, <xref ref-type="supplementary-material" rid="SM1">
<bold>2</bold>
</xref>.</p>
<p>All used algorithms according to the history of ML into traditional regression ML models (<italic>n</italic> = 14), ML models (<italic>n</italic> = 21), and deep learning (DL) models (<italic>n</italic> = 4). Traditional regression ML models refer to those that use regression techniques of ML, including LR and LASSO. ML models are more complex than traditional regression ML models (such as RF, DT, SVM, et&#xa0;al). Additionally, we defined DL models as neural networks with two or more hidden layers, such as CNN and ANN. We then pooled their AUC. The results indicated that the pooled AUC for traditional regression ML models was 0.797 (95% CI 0.777-0.816) with significant heterogeneity (<italic>I</italic>&#xb2;= 96.7%, <italic>P</italic> = 0.000), for ML models was 0.811 (95% CI 0.785-0.836; <italic>I</italic>&#xb2;= 99.9%, <italic>P</italic> = 0.000 for heterogeneity). In contrast, the pooled AUC for DL models was 0.863 (95% CI 0.825-0.900; <italic>I</italic>&#xb2;= 81.1%, <italic>P</italic> = 0.000 for heterogeneity), indicating a outperformed both ML and traditional regression ML models. The results of the meta-analysis were presented in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;3</bold>
</xref>.</p>
<p>A total of 26 different ML models were analyzed. To identify which models performed best, we pooled and compared the AUC of those models that were used three or more times. The results indicated that the pooled AUCs were as follows: AdaBoost, 0.798 (95% CI 0.729-0.868); BN, 0.815 (95% CI 0.777-0.854); DT, 0.748 (95% CI 0.567-0.929); GBDT, 0.821 (95% CI 0.757-0.885); LASSO, 0.820 (95% CI 0.816-0.825); LR, 0.793 (95% CI 0.764-0.823); NB, 0.788 (95% CI 0.737-0.840); RF, 0.848 (95% CI 0.785-0.911); SVM, 0.825 (95% CI 0.690-0.960); and XGBoost, 0.829 (95% CI 0.724-0.934). Among the models, the RF exhibited the best performance, while the DT model had the lowest performance; however, these differences were not statistically significant. Despite the high degree of heterogeneity, the 95% PIs for ML models demonstrated statistical significance (0.53&#x2013;1.00). The results of the meta-analysis were presented in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Random effects forest plot of area under the curve (AUC) values with 95% confidence intervals (CI) in machine learning (ML) type. AUC, area under the curve; AdaBoost, Adaptive Boosting; BN, Bayesian networks; DT, decision tree; GBDT, gradient boosted decision trees; LASSO, Least Absolute Shrinkage and Selection Operator; LR, logistic regression; NB, Naive Bayes; RF, random forest; SVM, support vector machine; XGBoost, Extreme Gradient Boosting. The weight % represents the contribution of each study to the overall analysis. The diamond shapes indicate pooled AUC estimates for each subgroup (internal, external) and the overall analysis. Horizontal lines represent the confidence intervals for individual studies, and the dashed vertical line indicates the pooled AUC estimate. p values from Cochran&#x2019;s Q test.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-16-1495306-g003.tif"/>
</fig>
</sec>
<sec id="s3_8">
<label>3.8</label>
<title>Sensitivity analysis</title>
<p>A total of 25 studies were included, and excluding any single study did not result in a statistically significant difference in the pooled results from the remaining studies (<italic>n</italic> = 24). The results remained consistent with the original pooled AUC (0.84, 95% CI 0.79-0.89), indicating the stability of the findings. The results of the sensitivity analysis were presented in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;4</bold>
</xref>.</p>
</sec>
<sec id="s3_9">
<label>3.9</label>
<title>Predictors screened</title>
<p>The final predictors selected for developing the ML model can be categorized into 14 types: demographic characteristics, medical history, T2DM duration, previous drug use history, complication information, social lifestyle history, family history, physical examination, laboratory examinations, renal histopathological results, radiomic signatures, circulating metabolites, genetic attributes, and retinal photographs. Based on these studies, we can identify several risk factors for the development of DKD in patients with T2DM. These include age, gender, race; history of hypertension, cardiovascular disease, cerebrovascular disease; T2DM duration; smoking, alcohol; family history of diabetes; use of antidiabetic (e.g., insulin, glinides, TZDs) and antihypertensive medications; complications such as diabetic retinopathy and diabetic peripheral vascular disease; physical examination parameters like height, weight, BMI, pulse pressure, systolic blood pressure (SBP), diastolic blood pressure (DBP), and waist-to-hip ratio; Additionally, laboratory examinations result such as 2-hour Postprandial glucose (2hPPG), glucose, insulin, fasting blood glucose (FBG), hemoglobin A1c, low-density lipoprotein (LDL), high-density lipoprotein(HDL), triglycerides, total cholesterol; circulating metabolites like tyrosine, lactate, intermediate-density lipoprotein cholesteryl ester % (IDL-CE%); and citrate, genetic attributes including uteroglobin gene G38A mutation (UGB G38A), LIPC514C &gt; T, and apolipoprotein B threonine to isoleucine substitution at position 71 (APOBThr71Ile); as well as renal histopathological results; retinal photographs, and renal radiomic signatures. We have integrated these predictors, as shown in <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Predictors included in the machine learning model.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Feature</th>
<th valign="middle" align="center">Final Predictors</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Demographic characteristics</td>
<td valign="top" align="left">Age, Gender, Race</td>
</tr>
<tr>
<td valign="top" align="left">Medical history</td>
<td valign="top" align="left">Hypertension, Cardiovascular disease, Cerebrovascular disease</td>
</tr>
<tr>
<td valign="top" align="left">Duration</td>
<td valign="top" align="left">T2DM duration</td>
</tr>
<tr>
<td valign="top" align="left">Social lifestyle history</td>
<td valign="top" align="left">Smoking, Alcohol</td>
</tr>
<tr>
<td valign="top" align="left">Family history</td>
<td valign="top" align="left">Family history of diabetes</td>
</tr>
<tr>
<td valign="top" align="left">Histopathological</td>
<td valign="top" align="left">Renal histopathological results</td>
</tr>
<tr>
<td valign="top" align="left">Radiomic signatures</td>
<td valign="top" align="left">Renal radiomic signatures</td>
</tr>
<tr>
<td valign="top" align="left">Photographs</td>
<td valign="top" align="left">Retinal Photographs</td>
</tr>
<tr>
<td valign="top" align="left">Circulating metabolites</td>
<td valign="top" align="left">Tyrosine, Lactate, DL-CE%, Citrate, Glycoprotein acetyls, LLDL-PL%, Alanine.</td>
</tr>
<tr>
<td valign="top" align="left">Genetic attributes</td>
<td valign="top" align="left">(Urinary Glucose Blood Glycine 38 to Alanine Mutation) UGB G38A, Lipase C Gene Mutation (514C &gt; T) (LIPC514C &gt; T), Apolipoprotein B Threonine 71 to Isoleucine Mutation (APOBThr71Ile), Apolipoprotein C3 Gene Mutation (3206T &gt; G) (APOC33206T &gt; G) and Apolipoprotein C3 Gene Mutation (1100C &gt; T) (APOC31100C &gt; T)</td>
</tr>
<tr>
<td valign="top" align="left">Previous drug use history</td>
<td valign="top" align="left">Antidiabetic medications: insulin use, TZDs, glinides, DPP-4 inhibitors, GLP-1 receptor agonists, SGLT-2 inhibitors; Antihypertensive medications</td>
</tr>
<tr>
<td valign="top" align="left">Complication information</td>
<td valign="top" align="left">Diabetic retinopathy<break/>Diabetic peripheral vascular disease<break/>Macrovascular complications of diabetes</td>
</tr>
<tr>
<td valign="top" align="left">Physical examination</td>
<td valign="top" align="left">Height, Weight, BMI, Pulse pressure, SBP, DBP, DAP, SAP</td>
</tr>
<tr>
<td valign="top" align="left">Laboratory examinations</td>
<td valign="top" align="left">2hPPG, GLU, INS, FBG, HbA1c;<break/>LDL, HDL, TG, TC, Apo-A, Apo-B, APB: APA;<break/>BUN, CREA, BUN/CREA, UA, eGFR, 24h-UTP, MAU, ACR, CYS-C, hematuria, significant proteinuria;<break/>ALB, GLB, ALP, &#x3b3;GGT, ALT, AST;<break/>HCT, WBC, PLT, PDW, MCHC, HGB, PCV, RDW-SD, RDW, MPV, Mon%, Bas, Eos, Neu, P-LCR, Lym;<break/>FT3, TSH, IGF-1, FIB, INR, Tyr, C2, C4DC, C5DC, C24, Na, K, PP, PLT, PT, TT, Bicarbonate, DHA, LLDL-CE%, IDLC%.</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>T2DM, Type 2 Diabetes Mellitus; DL-CE%, Double Layer Cholesterol Ester Percentage; LLDL-PL%, Large Low-Density Lipoprotein Phospholipid Percentage; UGB, Urinary Glucose Blood; G38A, Glycine 38 to Alanine Mutation; LIPC514C &gt; T, Lipase C Gene Mutation (514C &gt; T); APOBThr71Ile, Apolipoprotein B Threonine 71 to Isoleucine Mutation; APOC33206T &gt; G, Apolipoprotein C3 Gene Mutation (3206T &gt; G); APOC31100C &gt; T, Apolipoprotein C3 Gene Mutation (1100C &gt; T); TZDs, Thiazolidinediones; DPP-4, Dipeptidyl Peptidase-4; GLP-1, Glucagon-Like Peptide-1; SGLT-2, Sodium-Glucose Cotransporter-2; BMI, Body Mass Index; SBP, Systolic blood pressure; DBP, Diastolic blood pressure; DAP, Waist-to-hip ratio, Diastolic arterial pressure; SAP, Systolic arterial pressure; 2hPPG, 2-hour Postprandial Plasma Glucose; GLU, Glucose; INS, Insulin; FBG, Fasting Blood Glucose; HbA1c, Hemoglobin A1c; LDL, Low-Density Lipoprotein; HDL, High-Density Lipoprotein; TG, Triglycerides; TC, Total Cholesterol; Apo-A, Apolipoprotein A; Apo-B, Apolipoprotein B; APA, Apoptosis-Associated Protein; BUN, Blood Urea Nitrogen; CREA, Creatinine; BUN/CREA, Blood Urea Nitrogen to Creatinine Ratio; UA, Uric Acid; eGFR, Estimated Glomerular Filtration Rate; 24h-UTP, 24-hour Urinary Total Protein; MAU, Microalbuminuria; ACR, Albumin-to-Creatinine Ratio; CYS-C, Cystatin C; ALB, Albumin; GLB, Globulin; ALP, Alkaline Phosphatase; &#x3b3;GGT, Gamma-Glutamyl transferase; ALT, Alanine Aminotransferase; AST, Aspartate Aminotransferase; HCT, Hematocrit; WBC; White Blood Cell Count; PLT, Platelet Count; PDW, Platelet Distribution Width; MCHC, Mean Corpuscular Hemoglobin Concentration; HGB, Hemoglobin; PCV, Packed Cell Volume; RDW-SD, Red Cell Distribution Width-Standard Deviation; RDW, Red Cell Distribution Width; MPV, Mean Platelet Volume; Mon%, Monocyte Percentage; Bas, Basophil Count; Eos, Eosinophil Count; Neu, Neutrophil Count; P-LCR, Platelet Large Cell Ratio; Lym, Lymphocyte Count; FT3, Free Triiodothyronine; TSH, Thyroid-Stimulating Hormone; IGF-1, Insulin-Like Growth Factor-1; FIB, Fibrinogen; INR, International Normalized Ratio; Tyr, Tyrosine; C2, Carnitine C2 (Acetylcarnitine); C4DC, Butyrylcarnitine (C4 Dicarboxylate); C5DC, Glutarylcarnitine (C5 Dicarboxylate); C24 - Tetracosanoylcarnitine (C24); PP, Pancreatic Polypeptide; PT, Prothrombin Time; TT, Thrombin Time; Bicarbonate, Bicarbonate Ion; DHA, Docosahexaenoic Acid; LLDL-CE%, Large Low-Density Lipoprotein Cholesterol Ester Percentage; IDLC%, Intermediate-Density Lipoprotein Cholesterol Percentage.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>This meta-analysis systematically evaluated the application of ML-based risk prediction models for assessing the risk of DKD in patients with T2DM. We conducted a comprehensive analysis of 26 studies, exploring critical aspects such as study quality, the stability of internal and external validation, the performance of various ML models, and the types of predictive factors used.</p>
<p>Early prediction and identification of DKD are crucial for preserving renal function in patients with T2DM. This can lead to timely therapeutic interventions and lifestyle modifications, preventing disease progression to advanced stages and reducing dependence on dialysis and high healthcare expenditures (<xref ref-type="bibr" rid="B63">63</xref>). However, DKD often manifests insidiously. Our analysis indicated that ML demonstrates promising performance in predicting and identifying DKD in T2DM patients. The pooled AUC from internal validation sets was 0.839 (95% CI 0.787-0.890), and for external validation, it was 0.830 (95% CI 0.784-0.877). These findings suggest that our study could provide valuable insights for early clinical prediction of DKD.</p>
<p>It is important to note that the pooled AUC demonstrates considerable heterogeneity. This heterogeneity among subgroups may stem from variations in data sources and types. The studies included in this analysis draw upon diverse datasets, encompassing prospective clinical sample collections, publicly available datasets, and electronic health records. The data types also vary, including clinical laboratory tests, blood metabolomics, imaging, and genomics. All of which may contribute to the observed heterogeneity. Moreover, variations in the assessment tools for DKD, the demographic characteristics of the study populations, and the types of research designs may contribute to the heterogeneity across studies. In our analysis, the sample sizes of the included studies varied significantly, ranging from 133 to 147,664 participants. While sample size is an important factor, the proportion of positive cases is arguably more critical, as it determines the weight of each study. Consequently, a larger sample size may not directly influence the AUC value. However, studies with smaller sample sizes may experience a reduction in machine learning model performance, which could also serve as a potential source of heterogeneity.</p>
<p>Despite the significant potential demonstrated by extant studies in the application of machine learning for multidimensional data processing and risk prediction, the lack of external validation using completely independent datasets remains a major methodological issue in risk prediction model research (<xref ref-type="bibr" rid="B64">64</xref>, <xref ref-type="bibr" rid="B65">65</xref>). Similarly, among the 26 studies included in our review, only 8 conducted external validation (<xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B44">44</xref>&#x2013;<xref ref-type="bibr" rid="B46">46</xref>, <xref ref-type="bibr" rid="B52">52</xref>, <xref ref-type="bibr" rid="B56">56</xref>, <xref ref-type="bibr" rid="B58">58</xref>), while the remaining studies did not employ external validation. External validation is imperative for evaluation of a model&#x2019;s robustness and generalizability (<xref ref-type="bibr" rid="B66">66</xref>&#x2013;<xref ref-type="bibr" rid="B68">68</xref>). It not only evaluates the model&#x2019;s predictive ability but also tests its adaptability to new environments or different datasets, thereby revealing its effectiveness and limitations in real-world clinical practice (<xref ref-type="bibr" rid="B69">69</xref>). Although the negligible discrepancy (AUC values from internal and external validation sets differed by only 0.009), the absence of external validation hinders our understanding of the actual capability of the generalizability in our pooled models. This limitation restricts the applicability of our findings to diverse regions, environments, and healthcare systems. In addition, model overfitting or selectivity bias can result in good performance on the training set but poor performance on the external validation set (<xref ref-type="bibr" rid="B70">70</xref>). External validation can reveal whether the model has overfitted the training set, as well as selective bias during internal validation. In our study, it is also not yet clear whether there is overfitting or selective bias in the training set data due to the lack of external validation.</p>
<p>ML enhances model performance by synthesizing complex relationships among variables, surpassing traditional statistical analysis methods (<xref ref-type="bibr" rid="B67">67</xref>). Currently, ML algorithms are widely applied in the healthcare industry, demonstrating significant advantages in disease risk prediction. Another meta-analysis by Saputro et&#xa0;al. (<xref ref-type="bibr" rid="B8">8</xref>) focused solely on the performance of traditional Cox regression and LR models, without reporting on other ML techniques. Our study is the first systematic review to predict the risk of DKD in T2DM patients using ML algorithms. We categorized ML models according to their chronological development into traditional regression ML models, general ML models, and DL models, and subsequently compared their performance. Our results indicated that DL models consistently outperform both regression-based and other ML models, aligning with findings from previous studies (<xref ref-type="bibr" rid="B71">71</xref>, <xref ref-type="bibr" rid="B72">72</xref>). The superior performance of DL models in these studies can be attributed to their capacity to process unstructured data (<xref ref-type="bibr" rid="B73">73</xref>). Such data include diabetic retinal images, renal ultrasound scans, and renal pathology slides, which directly reflect the pathological state of DKD. DL models (CNN, ANN et&#xa0;al) are capable of automatically extracting high-dimensional features such as vascular morphology and renal tissue microstructure, which are often challenging for other traditional ML techniques to capture (<xref ref-type="bibr" rid="B74">74</xref>). However, traditional ML algorithms can still achieve high performance with less computational power and smaller datasets. These models predominantly rely on structured data, including demographic information, laboratory metrics, lifestyle factors, and other clearly defined data with standardized units, which underscores their inherent strengths. Notably, the study by Betzler et&#xa0;al. found that modeling based on DL in combination with risk factors obtained by RF screening yielded more effective results. Consequently, future studies that can integrate structural data and unstructured data by multimodal modeling may further improve the prediction of DKD risk.</p>
<p>In addition, we evaluated and compared the performance of common ML models (e.g., LR, RF, DT, SVM, etc.) separately. Our results indicated that the RF model yielded the highest performance, with a pooled AUC of 0.848 (95% CI 0.785-0.911), outperforming the other models. This superior performance may be attributed to unique ability to its unique ability to handle feature importance, strong generalization, avoidance of overfitting and proficiency in processing high-dimensional data (<xref ref-type="bibr" rid="B75">75</xref>, <xref ref-type="bibr" rid="B76">76</xref>). RF is an ensemble learning algorithm that solves classification and regression problems by constructing multiple DTs, enabling the model to effectively assess the relative importance of each feature in prediction (<xref ref-type="bibr" rid="B77">77</xref>). This characteristic aids in identifying the most influential predictors of DKD risk, thereby providing valuable support for clinical decision-making. Additionally, RF trains each tree by randomly selecting subsets of features and data, a strategy that significantly reduces the overfitting risks typically associated with individual models, thereby enhancing the model&#x2019;s generalizability. Moreover, RF&#x2019;s parallelization capability results in high computational efficiency, markedly reducing training time (<xref ref-type="bibr" rid="B78">78</xref>). This efficiency enables the RF model to process large-scale clinical data, such as electronic health records, genomic data, and imaging information, quickly. This makes RF particularly suitable for clinical settings where real-time predictions or immediate decision-making are required. Unlike our study, the meta-analysis by Feng et&#xa0;al. (<xref ref-type="bibr" rid="B79">79</xref>) found that the LR model achieved a higher AUC in predicting stroke onset timing. Similarly, Wu et&#xa0;al. reported that neural network algorithms outperformed others in screening for diabetic retinopathy (<xref ref-type="bibr" rid="B80">80</xref>). These results suggest that, in practical applications, the selection of a model should be based on the specific research objectives and the characteristics of the dataset.</p>
<p>The selection of effective features is of critical importance for the enhancement of both the predictive accuracy and interpretability of ML models in clinical applications. To this end, a comprehensive integration of the predictors that were ultimately incorporated into the models was conducted. The final selection comprised fourteen distinct categories of predictors, including demographic data, medical history, duration of T2DM, prior medication use, comorbidity profiles, lifestyle factors, family medical history, physical examination results, laboratory findings, renal biopsy data, radiomic features, circulating metabolites, genetic markers, and retinal imaging results. The heterogeneity of these predictive factors is reflective of the intricate and multifaceted pathophysiological underpinnings of DKD risk (<xref ref-type="bibr" rid="B81">81</xref>, <xref ref-type="bibr" rid="B82">82</xref>). It is noteworthy that age has been consistently validated in numerous studies as a pivotal predictor of DKD (<xref ref-type="bibr" rid="B5">5</xref>). Moreover, the duration of T2DM is recognized as a pivotal factor in DKD progression. Extensive research indicates that a longer duration of T2DM significantly escalates the risk of DKD, a phenomenon that is intrinsically linked to the chronic renal damage induced by sustained hyperglycemia (<xref ref-type="bibr" rid="B83">83</xref>, <xref ref-type="bibr" rid="B84">84</xref>). Furthermore, complications, such as diabetic retinopathy and peripheral vascular disease are also closely associated with an increased risk of DKD. These complications serve as hallmarks of systemic microvascular pathology, indicating an increased likelihood of renal impairment (<xref ref-type="bibr" rid="B85">85</xref>). The integration of emerging predictive factors, such as renal biopsy data, circulating metabolites, genetic markers, and radiomic features, underscores the forefront of interdisciplinary approaches in DKD risk prediction. These high-dimensional datasets enrich the input variables for complex models, thereby enhancing predictive precision and bolstering the models&#x2019; generalizability (<xref ref-type="bibr" rid="B81">81</xref>).</p>
<p>This study represents the first comprehensive review of the application of ML models for predicting DKD risk in patients with T2DM. A principal strength of our study is the rigorous and systematically developed methodology, which is not only logically sound but also sufficiently detailed to ensure reproducibility. Almost all published studies on the risk of DKD in patients with T2DM were included in this meta-analysis, facilitating comprehensive comparisons across different studies. In addition, we extensive searched multiple databases in accordance with PRISMA guidelines. Two independent reviewers systematically accomplished literature screening, data extraction, and a detailed risk of bias assessment using the PROBAST checklist, which improved the credibility and reliability of the study results.</p>
<p>The present study also reveals a number of limitations (1). The limited availability of external validation studies constrains the generalizability of our findings (2). The studies included in this meta-analysis varied in design, with the majority being retrospective single-center cohort studies, which are prone to selection bias and information bias (3). There is considerable variation in sample sizes across studies. Studies with smaller sample sizes may experience greater random error in estimating feature factors, leading to potential overfitting or underfitting of the model (4). The variability in the sources of predictive factors also affected the consistency of the study results. While the diversity of data sources enriches the model&#x2019;s input dimensions, it may also introduce issues related to data quality and consistency (5). Most studies exhibit notable shortcomings in handling missing data. These discrepancies may affect the prediction accuracy and stability of the models (6). There is considerable variation in the methods used for selecting predictive factors, and the choice of method can influence both the complexity and interpretability of the model.</p>
<p>The integration of ML with medical expertise maximizes its clinical efficacy. By providing clinicians with patient risk information and encouraging the active use of clinical decision-making tools, rather than passive reliance on them, early detection, treatment, and prognosis of diseases are significantly enhanced. Additionally, the streamlined presentation of data improves clinicians&#x2019; knowledge and experience, while the application of ML models can substantially reduce both time and economic costs. Therefore, we recommend that future research focus on the following aspects to enhance the standardization of study conduct and reporting, thereby advancing the field (1): In terms of study design, future research should focus on conducting large-scale prospective studies. (2) Concerning study populations, it is crucial to select appropriate data sources and ensure the rationality of inclusion and exclusion criteria. (3) For predictive factors, it is important to clearly define and assess these factors consistently across all populations and verify the effectiveness of the factors included in predictive models. (4) Appropriate methods for handling missing data should be employed. (5) Future research should place greater emphasis on external validation, particularly through the use of multi-center, large-scale datasets across diverse regions, to enhance the generalizability of the models. (6) In the discussion of results, a detailed evaluation of potential biases should be provided, along with exploration of strategies to mitigate these biases. (7) Whenever feasible, research data and processing codes should be made publicly available, and standardized evaluation datasets should be established to enhance the reproducibility and generalizability of future research. (8) Future studies should emphasize the transparency and standardization of data processing methods to ensure the reliability and broader applicability of results. (9) The integration of interpretable algorithms, such as the Shapley additive explanation (SHAP) algorithm, to interpret risk prediction models can help clinicians better understand the key drivers behind model predictions, thereby enhancing clinical decision-making.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusion</title>
<p>ML algorithms have demonstrated high performance in predicting the risk of DKD in T2DM patients. By integrating various demographic characteristics, biomarkers, and clinical data, these models offer more precise risk predictions compared to traditional methods. However, challenges related to data bias during model development and validation still need to be addressed. Future research should focus on enhancing data transparency and standardization, as well as validating these models&#x2019; generalizability through multicenter studies. In summary, the application of machine learning in predicting diabetic nephropathy risk holds significant clinical value and represents a more selective and cost-effective screening method for diabetic nephropathy.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. Further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>YL: Data curation, Formal analysis, Methodology, Software, Visualization, Writing &#x2013; original draft. NJ: Data curation, Formal analysis, Writing &#x2013; original draft. QZ: Data curation, Investigation, Writing &#x2013; original draft. YH: Data curation, Software, Writing &#x2013; review &amp; editing. AS: Writing &#x2013; review &amp; editing, Investigation. FY: Writing &#x2013; review &amp; editing, Investigation. ZZL: Writing &#x2013; review &amp; editing, Investigation. JH: Methodology, Writing &#x2013; review &amp; editing. ZTL: Methodology, Supervision, Writing &#x2013; review &amp; editing.</p>
</sec>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the&#xa0;research, authorship, and/or publication of this article. The study was financially supported by the National Key Research and&#xa0;Development Program of China (2022YFC3502400), the Traditional Chinese Medicine Innovation Teams and Talent Support Program (ZYYCXTD-D-202205), and the Chinese and Western Medicine Collaborative Chronic Disease Management Research Project (CXZH2024054).</p>
</sec>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fendo.2025.1495306/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fendo.2025.1495306/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<collab>Kidney Disease: Improving Global Outcomes (KDIGO) Diabetes Work Group</collab>
</person-group>. <article-title>KDIGO 2022 clinical practice guideline for diabetes management in chronic kidney disease</article-title>. <source>Kidney Int</source>. (<year>2022</year>) <volume>102</volume>:<fpage>S1</fpage>&#x2013;<lpage>s127</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.kint.2022.06.008</pub-id>
</citation>
</ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname> <given-names>H</given-names>
</name>
<name>
<surname>Saeedi</surname> <given-names>P</given-names>
</name>
<name>
<surname>Karuranga</surname> <given-names>S</given-names>
</name>
<name>
<surname>Pinkepank</surname> <given-names>M</given-names>
</name>
<name>
<surname>Ogurtsova</surname> <given-names>K</given-names>
</name>
<name>
<surname>Duncan</surname> <given-names>BB</given-names>
</name>
<etal/>
</person-group>. <article-title>IDF&#xa0;Diabetes Atlas: Global, regional and country-level diabetes prevalence estimates for&#xa0;2021 and projections for 2045</article-title>. <source>Diabetes Res Clin Pract</source>. (<year>2022</year>) <volume>183</volume>:<elocation-id>109119</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.diabres.2021.109119</pub-id>
</citation>
</ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<collab>American Diabetes Association</collab>
</person-group>. <article-title>11. Microvascular complications and foot care: standards of medical care in diabetes-2019</article-title>. <source>Diabetes Care</source>. (<year>2019</year>) <volume>42</volume>:<page-range>S124&#x2013;s38</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.2337/dc19-S011</pub-id>
</citation>
</ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>D</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z</given-names>
</name>
</person-group>. <article-title>Exosomes: Advances, development and potential therapeutic strategies in diabetic nephropathy</article-title>. <source>Metabolism</source>. (<year>2021</year>) <volume>122</volume>:<elocation-id>154834</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.metabol.2021.154834</pub-id>
</citation>
</ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Koye</surname> <given-names>DN</given-names>
</name>
<name>
<surname>Magliano</surname> <given-names>DJ</given-names>
</name>
<name>
<surname>Nelson</surname> <given-names>RG</given-names>
</name>
<name>
<surname>Pavkov</surname> <given-names>ME</given-names>
</name>
</person-group>. <article-title>The global epidemiology of diabetes and kidney disease</article-title>. <source>Adv Chronic Kidney Dis</source>. (<year>2018</year>) <volume>25</volume>:<page-range>121&#x2013;32</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1053/j.ackd.2017.10.011</pub-id>
</citation>
</ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thomas</surname> <given-names>MC</given-names>
</name>
<name>
<surname>Brownlee</surname> <given-names>M</given-names>
</name>
<name>
<surname>Susztak</surname> <given-names>K</given-names>
</name>
<name>
<surname>Sharma</surname> <given-names>K</given-names>
</name>
<name>
<surname>Jandeleit-Dahm</surname> <given-names>KA</given-names>
</name>
<name>
<surname>Zoungas</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Diabetic kidney disease</article-title>. <source>Nat Rev Dis Primers</source>. (<year>2015</year>) <volume>1</volume>:<fpage>15018</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nrdp.2015.18</pub-id>
</citation>
</ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>XX</given-names>
</name>
<name>
<surname>Kong</surname> <given-names>J</given-names>
</name>
<name>
<surname>Yun</surname> <given-names>K</given-names>
</name>
</person-group>. <article-title>Prevalence of diabetic nephropathy among patients with type 2 diabetes mellitus in China: A meta-analysis of observational studies</article-title>. <source>J&#xa0;Diabetes Res</source>. (<year>2020</year>) <volume>2020</volume>:<elocation-id>2315607</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2020/2315607</pub-id>
</citation>
</ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Saputro</surname> <given-names>SA</given-names>
</name>
<name>
<surname>Pattanaprateep</surname> <given-names>O</given-names>
</name>
<name>
<surname>Pattanateepapon</surname> <given-names>A</given-names>
</name>
<name>
<surname>Karmacharya</surname> <given-names>S</given-names>
</name>
<name>
<surname>Thakkinstian</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Prognostic models of diabetic microvascular complications: a systematic review and meta-analysis</article-title>. <source>Syst Rev</source>. (<year>2021</year>) <volume>10</volume>:<fpage>288</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13643-021-01841-z</pub-id>
</citation>
</ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hippisley-Cox</surname> <given-names>J</given-names>
</name>
<name>
<surname>Coupland</surname> <given-names>C</given-names>
</name>
<name>
<surname>Robson</surname> <given-names>J</given-names>
</name>
<name>
<surname>Sheikh</surname> <given-names>A</given-names>
</name>
<name>
<surname>Brindle</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>Predicting risk of type 2 diabetes in England and Wales: prospective derivation and validation of QDScore</article-title>. <source>Bmj</source>. (<year>2009</year>) <volume>338</volume>:<elocation-id>b880</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj.b880</pub-id>
</citation>
</ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Noble</surname> <given-names>D</given-names>
</name>
<name>
<surname>Mathur</surname> <given-names>R</given-names>
</name>
<name>
<surname>Dent</surname> <given-names>T</given-names>
</name>
<name>
<surname>Meads</surname> <given-names>C</given-names>
</name>
<name>
<surname>Greenhalgh</surname> <given-names>T</given-names>
</name>
</person-group>. <article-title>Risk models and scores for type 2 diabetes: systematic review</article-title>. <source>Bmj</source>. (<year>2011</year>) <volume>343</volume>:<elocation-id>d7163</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj.d7163</pub-id>
</citation>
</ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>L</given-names>
</name>
<name>
<surname>Magliano</surname> <given-names>DJ</given-names>
</name>
<name>
<surname>Zimmet</surname> <given-names>PZ</given-names>
</name>
</person-group>. <article-title>The worldwide epidemiology of type 2 diabetes mellitus&#x2013;present and future perspectives</article-title>. <source>Nat Rev Endocrinol</source>. (<year>2011</year>) <volume>8</volume>:<page-range>228&#x2013;36</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nrendo.2011.183</pub-id>
</citation>
</ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jacobs</surname> <given-names>PG</given-names>
</name>
<name>
<surname>Herrero</surname> <given-names>P</given-names>
</name>
<name>
<surname>Facchinetti</surname> <given-names>A</given-names>
</name>
<name>
<surname>Vehi</surname> <given-names>J</given-names>
</name>
<name>
<surname>Kovatchev</surname> <given-names>B</given-names>
</name>
<name>
<surname>Breton</surname> <given-names>MD</given-names>
</name>
<etal/>
</person-group>. <article-title>Artificial intelligence and machine learning for improving glycemic control in diabetes: best practices, pitfalls, and opportunities</article-title>. <source>IEEE Rev BioMed Eng</source>. (<year>2024</year>) <volume>17</volume>:<fpage>19</fpage>&#x2013;<lpage>41</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/rbme.2023.3331297</pub-id>
</citation>
</ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rajkomar</surname> <given-names>A</given-names>
</name>
<name>
<surname>Dean</surname> <given-names>J</given-names>
</name>
<name>
<surname>Kohane</surname> <given-names>I</given-names>
</name>
</person-group>. <article-title>Machine learning in medicine</article-title>. <source>N Engl J Med</source>. (<year>2019</year>) <volume>380</volume>:<page-range>1347&#x2013;58</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1056/NEJMra1814259</pub-id>
</citation>
</ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Obermeyer</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Emanuel</surname> <given-names>EJ</given-names>
</name>
</person-group>. <article-title>Predicting the future - big data, machine learning, and clinical medicine</article-title>. <source>N Engl J Med</source>. (<year>2016</year>) <volume>375</volume>:<page-range>1216&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1056/NEJMp1606181</pub-id>
</citation>
</ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tan</surname> <given-names>H</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Yue</surname> <given-names>T</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>D</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>S</given-names>
</name>
<name>
<surname>Weng</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Machine learning approach reveals microbiome, metabolome, and lipidome profiles in type 1 diabetes</article-title>. <source>J Adv Res</source>. (<year>2023</year>) <volume>64</volume>:<page-range>213&#x2013;21</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jare.2023.11.025</pub-id>
</citation>
</ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Esteva</surname> <given-names>A</given-names>
</name>
<name>
<surname>Robicquet</surname> <given-names>A</given-names>
</name>
<name>
<surname>Ramsundar</surname> <given-names>B</given-names>
</name>
<name>
<surname>Kuleshov</surname> <given-names>V</given-names>
</name>
<name>
<surname>DePristo</surname> <given-names>M</given-names>
</name>
<name>
<surname>Chou</surname> <given-names>K</given-names>
</name>
<etal/>
</person-group>. <article-title>A guide to deep learning in healthcare</article-title>. <source>Nat Med</source>. (<year>2019</year>) <volume>25</volume>:<page-range>24&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41591-018-0316-z</pub-id>
</citation>
</ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>YK</given-names>
</name>
<name>
<surname>Na</surname> <given-names>KS</given-names>
</name>
</person-group>. <article-title>Application of machine learning classification for structural brain MRI in mood disorders: Critical review from a clinical perspective</article-title>. <source>Prog Neuropsychopharmacol Biol Psychiatry</source>. (<year>2018</year>) <volume>80</volume>:<fpage>71</fpage>&#x2013;<lpage>80</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.pnpbp.2017.06.024</pub-id>
</citation>
</ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Slieker</surname> <given-names>RC</given-names>
</name>
<name>
<surname>M&#xfc;nch</surname> <given-names>M</given-names>
</name>
<name>
<surname>Donnelly</surname> <given-names>LA</given-names>
</name>
<name>
<surname>Bouland</surname> <given-names>GA</given-names>
</name>
<name>
<surname>Dragan</surname> <given-names>I</given-names>
</name>
<name>
<surname>Kuznetsov</surname> <given-names>D</given-names>
</name>
<etal/>
</person-group>. <article-title>An omics-based machine learning approach to predict diabetes progression: a RHAPSODY study</article-title>. <source>Diabetologia</source>. (<year>2024</year>) <volume>67</volume>:<page-range>885&#x2013;94</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00125-024-06105-8</pub-id>
</citation>
</ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jordan</surname> <given-names>MI</given-names>
</name>
<name>
<surname>Mitchell</surname> <given-names>TM</given-names>
</name>
</person-group>. <article-title>Machine learning: Trends, perspectives, and prospects</article-title>. <source>Science</source>. (<year>2015</year>) <volume>349</volume>:<page-range>255&#x2013;60</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.aaa8415</pub-id>
</citation>
</ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Persson</surname> <given-names>F</given-names>
</name>
<name>
<surname>Rossing</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>Diagnosis of diabetic kidney disease: state of the art and future perspective</article-title>. <source>Kidney Int Suppl (2011)</source>. (<year>2018</year>) <volume>8</volume>:<fpage>2</fpage>&#x2013;<lpage>7</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.kisu.2017.10.003</pub-id>
</citation>
</ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Colhoun</surname> <given-names>HM</given-names>
</name>
<name>
<surname>Marcovecchio</surname> <given-names>ML</given-names>
</name>
</person-group>. <article-title>Biomarkers of diabetic kidney disease</article-title>. <source>Diabetologia</source>. (<year>2018</year>) <volume>61</volume>:<fpage>996</fpage>&#x2013;<lpage>1011</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00125-018-4567-5</pub-id>
</citation>
</ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cole</surname> <given-names>JB</given-names>
</name>
<name>
<surname>Florez</surname> <given-names>JC</given-names>
</name>
</person-group>. <article-title>Genetics of diabetes mellitus and diabetes complications</article-title>. <source>Nat Rev Nephrol</source>. (<year>2020</year>) <volume>16</volume>:<page-range>377&#x2013;90</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41581-020-0278-5</pub-id>
</citation>
</ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yip</surname> <given-names>W</given-names>
</name>
<name>
<surname>Ong</surname> <given-names>PG</given-names>
</name>
<name>
<surname>Teo</surname> <given-names>BW</given-names>
</name>
<name>
<surname>Cheung</surname> <given-names>CY</given-names>
</name>
<name>
<surname>Tai</surname> <given-names>ES</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>CY</given-names>
</name>
<etal/>
</person-group>. <article-title>Retinal vascular imaging markers and incident chronic kidney disease: A prospective cohort study</article-title>. <source>Sci Rep</source>. (<year>2017</year>) <volume>7</volume>:<fpage>9374</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-017-09204-2</pub-id>
</citation>
</ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Eddy</surname> <given-names>S</given-names>
</name>
<name>
<surname>Mariani</surname> <given-names>LH</given-names>
</name>
<name>
<surname>Kretzler</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Integrated multi-omics approaches to improve classification of chronic kidney disease</article-title>. <source>Nat Rev Nephrol</source>. (<year>2020</year>) <volume>16</volume>:<page-range>657&#x2013;68</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41581-020-0286-5</pub-id>
</citation>
</ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lekha S</surname> <given-names>MS</given-names>
</name>
</person-group>. <article-title>Recent advancements and future prospects on E-nose sensors technology and machine learning approaches for non-invasive diabetes diagnosis: A review</article-title>. <source>IEEE Rev BioMed Eng</source>. (<year>2021</year>) <volume>14</volume>:<page-range>127&#x2013;38</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/rbme.2020.2993591</pub-id>
</citation>
</ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sabanayagam</surname> <given-names>C</given-names>
</name>
<name>
<surname>He</surname> <given-names>F</given-names>
</name>
<name>
<surname>Nusinovici</surname> <given-names>S</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J</given-names>
</name>
<name>
<surname>Lim</surname> <given-names>C</given-names>
</name>
<name>
<surname>Tan</surname> <given-names>G</given-names>
</name>
<etal/>
</person-group>. <article-title>Prediction of diabetic kidney disease risk using machine learning models: A population-based cohort study of Asian adults</article-title>. <source>Elife</source>. (<year>2023</year>) <volume>12</volume>:<elocation-id>e81878</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.7554/eLife.81878</pub-id>
</citation>
</ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nicolucci</surname> <given-names>A</given-names>
</name>
<name>
<surname>Romeo</surname> <given-names>L</given-names>
</name>
<name>
<surname>Bernardini</surname> <given-names>M</given-names>
</name>
<name>
<surname>Vespasiani</surname> <given-names>M</given-names>
</name>
<name>
<surname>Rossi</surname> <given-names>MC</given-names>
</name>
<name>
<surname>Petrelli</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Prediction of complications of type 2 Diabetes: A Machine learning approach</article-title>. <source>Diabetes Res Clin Pract</source>. (<year>2022</year>) <volume>190</volume>:<elocation-id>110013</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.diabres.2022.110013</pub-id>
</citation>
</ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Page</surname> <given-names>MJ</given-names>
</name>
<name>
<surname>McKenzie</surname> <given-names>JE</given-names>
</name>
<name>
<surname>Bossuyt</surname> <given-names>PM</given-names>
</name>
<name>
<surname>Boutron</surname> <given-names>I</given-names>
</name>
<name>
<surname>Hoffmann</surname> <given-names>TC</given-names>
</name>
<name>
<surname>Mulrow</surname> <given-names>CD</given-names>
</name>
<etal/>
</person-group>. <article-title>The PRISMA 2020 statement: an updated guideline for reporting systematic reviews</article-title>. <source>Bmj</source>. (<year>2021</year>) <volume>372</volume>:<elocation-id>n71</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj.n71</pub-id>
</citation>
</ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moons</surname> <given-names>KG</given-names>
</name>
<name>
<surname>de Groot</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Bouwmeester</surname> <given-names>W</given-names>
</name>
<name>
<surname>Vergouwe</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Mallett</surname> <given-names>S</given-names>
</name>
<name>
<surname>Altman</surname> <given-names>DG</given-names>
</name>
<etal/>
</person-group>. <article-title>Critical appraisal and data extraction for systematic reviews of prediction modelling studies: the CHARMS checklist</article-title>. <source>PloS Med</source>. (<year>2014</year>) <volume>11</volume>:<elocation-id>e1001744</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pmed.1001744</pub-id>
</citation>
</ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Canellas</surname> <given-names>J</given-names>
</name>
<name>
<surname>Ritto</surname> <given-names>FG</given-names>
</name>
<name>
<surname>Rodolico</surname> <given-names>A</given-names>
</name>
<name>
<surname>Aguglia</surname> <given-names>E</given-names>
</name>
<name>
<surname>Fernandes</surname> <given-names>GVO</given-names>
</name>
<name>
<surname>Figueredo</surname> <given-names>C</given-names>
</name>
<etal/>
</person-group>. <article-title>The international platform of registered systematic review and meta-analysis protocols (INPLASY) at 3 years: an analysis of 4,658 registered protocols on inplasy.com, platform features, and website statistics</article-title>. <source>Front Res Metr Anal</source>. (<year>2023</year>) <volume>8</volume>:<elocation-id>1135853</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/frma.2023.1135853</pub-id>
</citation>
</ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<collab>American Diabetes Association</collab>
</person-group>. <article-title>2. Classification and diagnosis of diabetes: standards of medical care in diabetes-2018</article-title>. <source>Diabetes Care</source>. (<year>2018</year>) <volume>41</volume>:<fpage>S13</fpage>&#x2013;<lpage>s27</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2337/dc18-S002</pub-id>
</citation>
</ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Collins</surname> <given-names>GS</given-names>
</name>
<name>
<surname>Moons</surname> <given-names>KGM</given-names>
</name>
<name>
<surname>Dhiman</surname> <given-names>P</given-names>
</name>
<name>
<surname>Riley</surname> <given-names>RD</given-names>
</name>
<name>
<surname>Beam</surname> <given-names>AL</given-names>
</name>
<name>
<surname>Van Calster</surname> <given-names>B</given-names>
</name>
<etal/>
</person-group>. <article-title>TRIPOD+AI statement: updated guidance for reporting clinical prediction models that use regression or machine learning methods</article-title>. <source>Bmj</source>. (<year>2024</year>) <volume>385</volume>:<elocation-id>e078378</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj-2023-078378</pub-id>
</citation>
</ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moons</surname> <given-names>KGM</given-names>
</name>
<name>
<surname>Wolff</surname> <given-names>RF</given-names>
</name>
<name>
<surname>Riley</surname> <given-names>RD</given-names>
</name>
<name>
<surname>Whiting</surname> <given-names>PF</given-names>
</name>
<name>
<surname>Westwood</surname> <given-names>M</given-names>
</name>
<name>
<surname>Collins</surname> <given-names>GS</given-names>
</name>
<etal/>
</person-group>. <article-title>PROBAST: A tool to assess risk of bias and applicability of prediction model studies: explanation and elaboration</article-title>. <source>Ann Intern Med</source>. (<year>2019</year>) <volume>170</volume>:<fpage>W1</fpage>&#x2013;<lpage>w33</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.7326/m18-1377</pub-id>
</citation>
</ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Debray</surname> <given-names>TP</given-names>
</name>
<name>
<surname>Damen</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Riley</surname> <given-names>RD</given-names>
</name>
<name>
<surname>Snell</surname> <given-names>K</given-names>
</name>
<name>
<surname>Reitsma</surname> <given-names>JB</given-names>
</name>
<name>
<surname>Hooft</surname> <given-names>L</given-names>
</name>
<etal/>
</person-group>. <article-title>A framework for meta-analysis of prediction model studies with binary and time-to-event outcomes</article-title>. <source>Stat Methods Med Res</source>. (<year>2019</year>) <volume>28</volume>:<page-range>2768&#x2013;86</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/0962280218785504</pub-id>
</citation>
</ref>
<ref id="B35">
<label>35</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hanley</surname> <given-names>JA</given-names>
</name>
<name>
<surname>McNeil</surname> <given-names>BJ</given-names>
</name>
</person-group>. <article-title>The meaning and use of the area under a receiver operating characteristic (ROC) curve</article-title>. <source>Radiology</source>. (<year>1982</year>) <volume>143</volume>:<fpage>29</fpage>&#x2013;<lpage>36</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1148/radiology.143.1.7063747</pub-id>
</citation>
</ref>
<ref id="B36">
<label>36</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Altman</surname> <given-names>DG</given-names>
</name>
<name>
<surname>Bland</surname> <given-names>JM</given-names>
</name>
</person-group>. <article-title>How to obtain the confidence interval from a P value</article-title>. <source>Bmj</source>. (<year>2011</year>) <volume>343</volume>:<elocation-id>d2090</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj.d2090</pub-id>
</citation>
</ref>
<ref id="B37">
<label>37</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>DerSimonian</surname> <given-names>R</given-names>
</name>
<name>
<surname>Laird</surname> <given-names>N</given-names>
</name>
</person-group>. <article-title>Meta-analysis in clinical trials revisited</article-title>. <source>Contemp Clin Trials</source>. (<year>2015</year>) <volume>45</volume>:<page-range>139&#x2013;45</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cct.2015.09.002</pub-id>
</citation>
</ref>
<ref id="B38">
<label>38</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thorlund</surname> <given-names>K</given-names>
</name>
<name>
<surname>Wetterslev</surname> <given-names>J</given-names>
</name>
<name>
<surname>Awad</surname> <given-names>T</given-names>
</name>
<name>
<surname>Thabane</surname> <given-names>L</given-names>
</name>
<name>
<surname>Gluud</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>Comparison of statistical inferences from the DerSimonian-Laird and alternative random-effects model meta-analyses - an empirical assessment of 920 Cochrane primary outcome meta-analyses</article-title>. <source>Res Synth Methods</source>. (<year>2011</year>) <volume>2</volume>:<page-range>238&#x2013;53</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/jrsm.53</pub-id>
</citation>
</ref>
<ref id="B39">
<label>39</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>L</given-names>
</name>
<name>
<surname>Zuo</surname> <given-names>L</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>X</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>S</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>A novel risk score model for the differential diagnosis of type 2 diabetic nephropathy: A multicenter study</article-title>. <source>J Diabetes Res</source>. (<year>2023</year>) <volume>2023</volume>:<elocation-id>5514767</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2023/5514767</pub-id>
</citation>
</ref>
<ref id="B40">
<label>40</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>R</given-names>
</name>
<name>
<surname>Shang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W</given-names>
</name>
</person-group>. <article-title>Analysis for warning factors of type 2 diabetes mellitus complications with Markov blanket based on a Bayesian network model</article-title>. <source>Comput Methods Programs Biomed</source>. (<year>2020</year>) <volume>188</volume>:<elocation-id>105302</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cmpb.2019.105302</pub-id>
</citation>
</ref>
<ref id="B41">
<label>41</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hui</surname> <given-names>D</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>J</given-names>
</name>
<name>
<surname>He</surname> <given-names>P</given-names>
</name>
<name>
<surname>Deng</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Analysis of clinical predictors of kidney diseases in type 2 diabetes patients based on machine learning</article-title>. <source>Int Urol Nephrol</source>. (<year>2023</year>) <volume>55</volume>:<page-range>687&#x2013;96</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11255-022-03322-1</pub-id>
</citation>
</ref>
<ref id="B42">
<label>42</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Momenzadeh</surname> <given-names>A</given-names>
</name>
<name>
<surname>Shamsa</surname> <given-names>A</given-names>
</name>
<name>
<surname>Meyer</surname> <given-names>JG</given-names>
</name>
</person-group>. <article-title>Bias or biology? Importance of model interpretation in machine learning studies from electronic health records</article-title>. <source>JAMIA Open</source>. (<year>2022</year>) <volume>5</volume>:<elocation-id>ooac063</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/jamiaopen/ooac063</pub-id>
</citation>
</ref>
<ref id="B43">
<label>43</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cai</surname> <given-names>SS</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>TY</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>KY</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>HP</given-names>
</name>
</person-group>. <article-title>Clinical study of different prediction models in predicting diabetic nephropathy in patients with type 2 diabetes mellitus</article-title>. <source>World J Diabetes</source>. (<year>2024</year>) <volume>15</volume>:<fpage>43</fpage>&#x2013;<lpage>52</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.4239/wjd.v15.i1.43</pub-id>
</citation>
</ref>
<ref id="B44">
<label>44</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Betzler</surname> <given-names>BK</given-names>
</name>
<name>
<surname>Chee</surname> <given-names>EYL</given-names>
</name>
<name>
<surname>He</surname> <given-names>F</given-names>
</name>
<name>
<surname>Lim</surname> <given-names>CC</given-names>
</name>
<name>
<surname>Ho</surname> <given-names>J</given-names>
</name>
<name>
<surname>Hamzah</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>Deep learning algorithms to detect diabetic kidney disease from retinal photographs in multiethnic populations with diabetes</article-title>. <source>J Am Med Inform Assoc</source>. (<year>2023</year>) <volume>30</volume>:<page-range>1904&#x2013;14</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/jamia/ocad179</pub-id>
</citation>
</ref>
<ref id="B45">
<label>45</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>He</surname> <given-names>F</given-names>
</name>
<name>
<surname>Ng Yin Ling</surname> <given-names>C</given-names>
</name>
<name>
<surname>Nusinovici</surname> <given-names>S</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>CY</given-names>
</name>
<name>
<surname>Wong</surname> <given-names>TY</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Development and external validation of machine learning models for diabetic microvascular complications: cross-sectional study with metabolites</article-title>. <source>J Med Internet Res</source>. (<year>2024</year>) <volume>26</volume>:<elocation-id>e41065</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.2196/41065</pub-id>
</citation>
</ref>
<ref id="B46">
<label>46</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hosseini Sarkhosh</surname> <given-names>SM</given-names>
</name>
<name>
<surname>Hemmatabadi</surname> <given-names>M</given-names>
</name>
<name>
<surname>Esteghamati</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Development and validation of a risk score for diabetic kidney disease prediction in type 2 diabetes patients: a machine learning approach</article-title>. <source>J Endocrinol Invest</source>. (<year>2023</year>) <volume>46</volume>:<page-range>415&#x2013;23</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s40618-022-01919-y</pub-id>
</citation>
</ref>
<ref id="B47">
<label>47</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Afrash</surname> <given-names>MR</given-names>
</name>
<name>
<surname>Rahimi</surname> <given-names>F</given-names>
</name>
<name>
<surname>Kazemi-Arpanahi</surname> <given-names>H</given-names>
</name>
<name>
<surname>Shanbezadeh</surname> <given-names>M</given-names>
</name>
<name>
<surname>Amraei</surname> <given-names>M</given-names>
</name>
<name>
<surname>Asadi</surname> <given-names>F</given-names>
</name>
</person-group>. <article-title>Development of an intelligent clinical decision support system for the early prediction of diabetic nephropathy</article-title>. <source>Inf Med Unlocked</source>. (<year>2022</year>) <volume>35</volume>:<elocation-id>101135</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.imu.2022.101135</pub-id>
</citation>
</ref>
<ref id="B48">
<label>48</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>D</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>C</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>J</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Xiong</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Da</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Diffusion tensor and kurtosis MRI-based radiomics analysis of kidney injury in type 2 diabetes</article-title>. <source>J Magn Reson Imaging</source>. (<year>2024</year>) <volume>60</volume>(<issue>5</issue>):<fpage>2078</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/jmri.29263</pub-id>
</citation>
</ref>
<ref id="B49">
<label>49</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yin</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Xue</surname> <given-names>JT</given-names>
</name>
<name>
<surname>Zong</surname> <given-names>GW</given-names>
</name>
<name>
<surname>Fang</surname> <given-names>ZZ</given-names>
</name>
<name>
<surname>Zou</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Explainable machine learning-based prediction model for diabetic nephropathy</article-title>. <source>J Diabetes Res</source>. (<year>2024</year>) <volume>2024</volume>:<elocation-id>8857453</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2024/8857453</pub-id>
</citation>
</ref>
<ref id="B50">
<label>50</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Song</surname> <given-names>X</given-names>
</name>
<name>
<surname>Waitman</surname> <given-names>LR</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>AS</given-names>
</name>
<name>
<surname>Robbins</surname> <given-names>DC</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Longitudinal risk prediction of chronic kidney disease in diabetic patients using a temporal-enhanced gradient boosting machine: retrospective cohort study</article-title>. <source>JMIR Med Inform</source>. (<year>2020</year>) <volume>8</volume>:<elocation-id>e15510</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.2196/15510</pub-id>
</citation>
</ref>
<ref id="B51">
<label>51</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fan</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Long</surname> <given-names>E</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>L</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>X</given-names>
</name>
<name>
<surname>Tong</surname> <given-names>R</given-names>
</name>
</person-group>. <article-title>Machine learning approaches to predict risks of diabetic complications and poor glycemic control in nonadherent type 2 diabetes</article-title>. <source>Front Pharmacol</source>. (<year>2021</year>) <volume>12</volume>:<elocation-id>665951</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fphar.2021.665951</pub-id>
</citation>
</ref>
<ref id="B52">
<label>52</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>W</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>X</given-names>
</name>
<name>
<surname>Dong</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Pei</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>New diagnostic model for the differentiation of diabetic nephropathy from non-diabetic nephropathy in chinese patients</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2022</year>) <volume>13</volume>:<elocation-id>913021</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fendo.2022.913021</pub-id>
</citation>
</ref>
<ref id="B53">
<label>53</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>XZ</given-names>
</name>
<name>
<surname>Duan</surname> <given-names>M</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>HD</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Xiang</surname> <given-names>TY</given-names>
</name>
<name>
<surname>Niu</surname> <given-names>WC</given-names>
</name>
<etal/>
</person-group>. <article-title>Predicting diabetic kidney disease for type 2 diabetes mellitus by machine learning in the real world: a multicenter retrospective study</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2023</year>) <volume>14</volume>:<elocation-id>1184190</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fendo.2023.1184190</pub-id>
</citation>
</ref>
<ref id="B54">
<label>54</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hosseini Sarkhosh</surname> <given-names>SM</given-names>
</name>
<name>
<surname>Esteghamati</surname> <given-names>A</given-names>
</name>
<name>
<surname>Hemmatabadi</surname> <given-names>M</given-names>
</name>
<name>
<surname>Daraei</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Predicting diabetic nephropathy in type 2 diabetic patients using machine learning algorithms</article-title>. <source>J Diabetes Metab Disord</source>. (<year>2022</year>) <volume>21</volume>:<page-range>1433&#x2013;41</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s40200-022-01076-2</pub-id>
</citation>
</ref>
<ref id="B55">
<label>55</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dong</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Ke</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W</given-names>
</name>
<name>
<surname>Hong</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>C</given-names>
</name>
<etal/>
</person-group>. <article-title>Prediction of 3-year risk of diabetic kidney disease using machine learning based on electronic medical records</article-title>. <source>J Transl Med</source>. (<year>2022</year>) <volume>20</volume>:<fpage>143</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12967-022-03339-1</pub-id>
</citation>
</ref>
<ref id="B56">
<label>56</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Allen</surname> <given-names>A</given-names>
</name>
<name>
<surname>Iqbal</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Green-Saxena</surname> <given-names>A</given-names>
</name>
<name>
<surname>Hurtado</surname> <given-names>M</given-names>
</name>
<name>
<surname>Hoffman</surname> <given-names>J</given-names>
</name>
<name>
<surname>Mao</surname> <given-names>Q</given-names>
</name>
<etal/>
</person-group>. <article-title>Prediction of diabetic kidney disease with machine learning algorithms, upon the initial diagnosis of type 2 diabetes mellitus</article-title>. <source>BMJ Open Diabetes Res Care</source>. (<year>2022</year>) <volume>10</volume>:<elocation-id>e002560</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmjdrc-2021-002560</pub-id>
</citation>
</ref>
<ref id="B57">
<label>57</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Maniruzzaman</surname> <given-names>M</given-names>
</name>
<name>
<surname>Islam</surname> <given-names>MM</given-names>
</name>
<name>
<surname>Rahman</surname> <given-names>MJ</given-names>
</name>
<name>
<surname>Hasan</surname> <given-names>MAM</given-names>
</name>
<name>
<surname>Shin</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Risk prediction&#xa0;of diabetic nephropathy using machine learning techniques: A pilot study&#xa0;with secondary data</article-title>. <source>Diabetes Metab Syndr</source>. (<year>2021</year>) <volume>15</volume>:<elocation-id>102263</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.dsx.2021.102263</pub-id>
</citation>
</ref>
<ref id="B58">
<label>58</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Song</surname> <given-names>X</given-names>
</name>
<name>
<surname>Waitman</surname> <given-names>LR</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>ASL</given-names>
</name>
<name>
<surname>Robbins</surname> <given-names>DC</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Robust clinical marker identification for diabetic kidney disease with ensemble feature selection</article-title>. <source>J Am Med Inform Assoc</source>. (<year>2019</year>) <volume>26</volume>:<page-range>242&#x2013;53</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/jamia/ocy165</pub-id>
</citation>
</ref>
<ref id="B59">
<label>59</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>G</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>B</given-names>
</name>
<name>
<surname>Qiao</surname> <given-names>G</given-names>
</name>
<name>
<surname>Lou</surname> <given-names>H</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>F</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Z</given-names>
</name>
<etal/>
</person-group>. <article-title>Screening tools based on nomogram for diabetic kidney diseases in chinese type 2 diabetes mellitus patients</article-title>. <source>Diabetes Metab J</source>. (<year>2021</year>) <volume>45</volume>:<page-range>708&#x2013;18</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.4093/dmj.2020.0117</pub-id>
</citation>
</ref>
<ref id="B60">
<label>60</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shi</surname> <given-names>S</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>L</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>B</given-names>
</name>
<name>
<surname>Xiao</surname> <given-names>J</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>W</given-names>
</name>
<etal/>
</person-group>. <article-title>The automatic detection of diabetic kidney disease from retinal vascular parameters combined with clinical variables using artificial intelligence in type-2 diabetes patients</article-title>. <source>BMC Med Inform Decis Mak</source>. (<year>2023</year>) <volume>23</volume>:<fpage>241</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12911-023-02343-9</pub-id>
</citation>
</ref>
<ref id="B61">
<label>61</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Leung</surname> <given-names>RK</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>RC</given-names>
</name>
<name>
<surname>Luk</surname> <given-names>AO</given-names>
</name>
<name>
<surname>Lam</surname> <given-names>V</given-names>
</name>
<name>
<surname>Ng</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Using a multi-staged strategy based on machine learning and mathematical modeling to predict genotype-phenotype risk patterns in diabetic kidney disease: a prospective case-control cohort analysis</article-title>. <source>BMC Nephrol</source>. (<year>2013</year>) <volume>14</volume>:<elocation-id>162</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2369-14-162</pub-id>
</citation>
</ref>
<ref id="B62">
<label>62</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Su</surname> <given-names>X</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>S</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>Y</given-names>
</name>
</person-group>. <article-title>Value of radiomics-based two-dimensional ultrasound for diagnosing early diabetic nephropathy</article-title>. <source>Sci Rep</source>. (<year>2023</year>) <volume>13</volume>:<fpage>20427</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-023-47449-2</pub-id>
</citation>
</ref>
<ref id="B63">
<label>63</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Levin</surname> <given-names>A</given-names>
</name>
<name>
<surname>Stevens</surname> <given-names>PE</given-names>
</name>
</person-group>. <article-title>Early detection of CKD: the benefits, limitations and effects on prognosis</article-title>. <source>Nat Rev Nephrol</source>. (<year>2011</year>) <volume>7</volume>:<page-range>446&#x2013;57</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nrneph.2011.86</pub-id>
</citation>
</ref>
<ref id="B64">
<label>64</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Collins</surname> <given-names>GS</given-names>
</name>
<name>
<surname>de Groot</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Dutton</surname> <given-names>S</given-names>
</name>
<name>
<surname>Omar</surname> <given-names>O</given-names>
</name>
<name>
<surname>Shanyinde</surname> <given-names>M</given-names>
</name>
<name>
<surname>Tajar</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>External validation of multivariable prediction models: a systematic review of methodological conduct and reporting</article-title>. <source>BMC Med Res Methodol</source>. (<year>2014</year>) <volume>14</volume>:<elocation-id>40</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2288-14-40</pub-id>
</citation>
</ref>
<ref id="B65">
<label>65</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Steyerberg</surname> <given-names>EW</given-names>
</name>
<name>
<surname>Moons</surname> <given-names>KG</given-names>
</name>
<name>
<surname>van der Windt</surname> <given-names>DA</given-names>
</name>
<name>
<surname>Hayden</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Perel</surname> <given-names>P</given-names>
</name>
<name>
<surname>Schroter</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Prognosis Research Strategy (PROGRESS) 3: prognostic model research</article-title>. <source>PloS Med</source>. (<year>2013</year>) <volume>10</volume>:<elocation-id>e1001381</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pmed.1001381</pub-id>
</citation>
</ref>
<ref id="B66">
<label>66</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Siontis</surname> <given-names>GC</given-names>
</name>
<name>
<surname>Tzoulaki</surname> <given-names>I</given-names>
</name>
<name>
<surname>Castaldi</surname> <given-names>PJ</given-names>
</name>
<name>
<surname>Ioannidis</surname> <given-names>JP</given-names>
</name>
</person-group>. <article-title>External validation of new risk prediction models is infrequent and reveals worse prognostic discrimination</article-title>. <source>J Clin Epidemiol</source>. (<year>2015</year>) <volume>68</volume>:<fpage>25</fpage>&#x2013;<lpage>34</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jclinepi.2014.09.007</pub-id>
</citation>
</ref>
<ref id="B67">
<label>67</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bates</surname> <given-names>DW</given-names>
</name>
<name>
<surname>Auerbach</surname> <given-names>A</given-names>
</name>
<name>
<surname>Schulam</surname> <given-names>P</given-names>
</name>
<name>
<surname>Wright</surname> <given-names>A</given-names>
</name>
<name>
<surname>Saria</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Reporting and implementing interventions involving machine learning and artificial intelligence</article-title>. <source>Ann Intern Med</source>. (<year>2020</year>) <volume>172</volume>:<page-range>S137&#x2013;s44</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.7326/m19-0872</pub-id>
</citation>
</ref>
<ref id="B68">
<label>68</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moons</surname> <given-names>KG</given-names>
</name>
<name>
<surname>Kengne</surname> <given-names>AP</given-names>
</name>
<name>
<surname>Grobbee</surname> <given-names>DE</given-names>
</name>
<name>
<surname>Royston</surname> <given-names>P</given-names>
</name>
<name>
<surname>Vergouwe</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Altman</surname> <given-names>DG</given-names>
</name>
<etal/>
</person-group>. <article-title>Risk prediction models: II. External validation, model updating, and impact assessment</article-title>. <source>Heart</source>. (<year>2012</year>) <volume>98</volume>:<page-range>691&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/heartjnl-2011-301247</pub-id>
</citation>
</ref>
<ref id="B69">
<label>69</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>la-Roi-Teeuw</surname> <given-names>HM</given-names>
</name>
<name>
<surname>van Royen</surname> <given-names>FS</given-names>
</name>
<name>
<surname>de Hond</surname> <given-names>A</given-names>
</name>
<name>
<surname>Zahra</surname> <given-names>A</given-names>
</name>
<name>
<surname>de Vries</surname> <given-names>S</given-names>
</name>
<name>
<surname>Bartels</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>Don't be misled: 3 misconceptions about external validation of clinical prediction models</article-title>. <source>J Clin Epidemiol</source>. (<year>2024</year>) <volume>172</volume>:<elocation-id>111387</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jclinepi.2024.111387</pub-id>
</citation>
</ref>
<ref id="B70">
<label>70</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Riley</surname> <given-names>RD</given-names>
</name>
<name>
<surname>Archer</surname> <given-names>L</given-names>
</name>
<name>
<surname>Snell</surname> <given-names>KIE</given-names>
</name>
<name>
<surname>Ensor</surname> <given-names>J</given-names>
</name>
<name>
<surname>Dhiman</surname> <given-names>P</given-names>
</name>
<name>
<surname>Martin</surname> <given-names>GP</given-names>
</name>
<etal/>
</person-group>. <article-title>Evaluation of clinical prediction models (part 2): how to undertake an external validation study</article-title>. <source>Bmj</source>. (<year>2024</year>) <volume>384</volume>:<elocation-id>e074820</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj-2023-074820</pub-id>
</citation>
</ref>
<ref id="B71">
<label>71</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smith</surname> <given-names>LA</given-names>
</name>
<name>
<surname>Oakden-Rayner</surname> <given-names>L</given-names>
</name>
<name>
<surname>Bird</surname> <given-names>A</given-names>
</name>
<name>
<surname>Zeng</surname> <given-names>M</given-names>
</name>
<name>
<surname>To</surname> <given-names>MS</given-names>
</name>
<name>
<surname>Mukherjee</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Machine learning and deep learning predictive models for long-term prognosis in patients with chronic obstructive pulmonary disease: a systematic review and meta-analysis</article-title>. <source>Lancet Digit Health</source>. (<year>2023</year>) <volume>5</volume>:<page-range>e872&#x2013;e81</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/s2589-7500(23)00177-2</pub-id>
</citation>
</ref>
<ref id="B72">
<label>72</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tu</surname> <given-names>JV</given-names>
</name>
</person-group>. <article-title>Advantages and disadvantages of using artificial neural networks versus&#xa0;logistic regression for predicting medical outcomes</article-title>. <source>J Clin Epidemiol</source>. (<year>1996</year>) <volume>49</volume>:<page-range>1225&#x2013;31</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/s0895-4356(96)00002-9</pub-id>
</citation>
</ref>
<ref id="B73">
<label>73</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>LeCun</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Bengio</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Hinton</surname> <given-names>G</given-names>
</name>
</person-group>. <article-title>Deep learning</article-title>. <source>Nature</source>. (<year>2015</year>) <volume>521</volume>:<page-range>436&#x2013;44</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature14539</pub-id>
</citation>
</ref>
<ref id="B74">
<label>74</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fogo</surname> <given-names>AB</given-names>
</name>
</person-group>. <article-title>Learning from deep learning and pathomics</article-title>. <source>Kidney Int</source>. (<year>2023</year>) <volume>104</volume>:<page-range>1050&#x2013;3</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.kint.2023.06.006</pub-id>
</citation>
</ref>
<ref id="B75">
<label>75</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Hang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>S</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>X</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>Y</given-names>
</name>
</person-group>. <article-title>Self-supervised random forest on transformed distribution for anomaly detection</article-title>. <source>IEEE Trans Neural Netw Learn Syst</source>. (<year>2024</year>) <volume>36</volume>:<page-range>2675&#x2013;89</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/tnnls.2023.3348833</pub-id>
</citation>
</ref>
<ref id="B76">
<label>76</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname> <given-names>L</given-names>
</name>
</person-group>. <source>Manual on setting up, using, and understanding random forests v3. 1</source> Vol. <volume>1</volume>. <publisher-name>Statistics Department University of California Berkeley, CA, USA</publisher-name> (<year>2002</year>) p. <fpage>3</fpage>&#x2013;<lpage>42</lpage>.</citation>
</ref>
<ref id="B77">
<label>77</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Speiser</surname> <given-names>JL</given-names>
</name>
<name>
<surname>Miller</surname> <given-names>ME</given-names>
</name>
<name>
<surname>Tooze</surname> <given-names>J</given-names>
</name>
<name>
<surname>Ip</surname> <given-names>E</given-names>
</name>
</person-group>. <article-title>A comparison of random forest variable selection methods for classification prediction modeling</article-title>. <source>Expert Syst Appl</source>. (<year>2019</year>) <volume>134</volume>:<fpage>93</fpage>&#x2013;<lpage>101</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.eswa.2019.05.028</pub-id>
</citation>
</ref>
<ref id="B78">
<label>78</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Paul</surname> <given-names>A</given-names>
</name>
<name>
<surname>Mukherjee</surname> <given-names>DP</given-names>
</name>
<name>
<surname>Das</surname> <given-names>P</given-names>
</name>
<name>
<surname>Gangopadhyay</surname> <given-names>A</given-names>
</name>
<name>
<surname>Chintha</surname> <given-names>AR</given-names>
</name>
<name>
<surname>Kundu</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Improved random forest for classification</article-title>. <source>IEEE Trans Image Process</source>. (<year>2018</year>) <volume>27</volume>:<page-range>4012&#x2013;24</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/tip.2018.2834830</pub-id>
</citation>
</ref>
<ref id="B79">
<label>79</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feng</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>F</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>J</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Z</given-names>
</name>
</person-group>. <article-title>The value of applying machine learning in predicting the time of symptom onset in stroke patients: systematic review and meta-analysis</article-title>. <source>J Med Internet Res</source>. (<year>2023</year>) <volume>25</volume>:<elocation-id>e44895</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.2196/44895</pub-id>
</citation>
</ref>
<ref id="B80">
<label>80</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>JH</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>TYA</given-names>
</name>
<name>
<surname>Hsu</surname> <given-names>WT</given-names>
</name>
<name>
<surname>Ho</surname> <given-names>JH</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>CC</given-names>
</name>
</person-group>. <article-title>Performance and limitation of machine learning algorithms for diabetic retinopathy screening: meta-analysis</article-title>. <source>J Med Internet Res</source>. (<year>2021</year>) <volume>23</volume>:<elocation-id>e23863</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.2196/23863</pub-id>
</citation>
</ref>
<ref id="B81">
<label>81</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alicic</surname> <given-names>RZ</given-names>
</name>
<name>
<surname>Rooney</surname> <given-names>MT</given-names>
</name>
<name>
<surname>Tuttle</surname> <given-names>KR</given-names>
</name>
</person-group>. <article-title>Diabetic kidney disease: challenges, progress, and possibilities</article-title>. <source>Clin J Am Soc Nephrol</source>. (<year>2017</year>) <volume>12</volume>:<page-range>2032&#x2013;45</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.2215/cjn.11491116</pub-id>
</citation>
</ref>
<ref id="B82">
<label>82</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pugliese</surname> <given-names>G</given-names>
</name>
<name>
<surname>Penno</surname> <given-names>G</given-names>
</name>
<name>
<surname>Natali</surname> <given-names>A</given-names>
</name>
<name>
<surname>Barutta</surname> <given-names>F</given-names>
</name>
<name>
<surname>Di Paolo</surname> <given-names>S</given-names>
</name>
<name>
<surname>Reboldi</surname> <given-names>G</given-names>
</name>
<etal/>
</person-group>. <article-title>Diabetic kidney disease: New clinical and therapeutic issues. Joint position statement of the Italian Diabetes Society and the Italian Society of Nephrology on "The natural history of diabetic kidney disease and treatment of hyperglycemia in patients with type 2 diabetes and impaired renal function</article-title>. <source>Nutr Metab Cardiovasc Dis</source>. (<year>2019</year>) <volume>29</volume>:<page-range>1127&#x2013;50</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.numecd.2019.07.017</pub-id>
</citation>
</ref>
<ref id="B83">
<label>83</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>G</given-names>
</name>
<name>
<surname>Ouyang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Li</surname> <given-names>S</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Lian</surname> <given-names>B</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z</given-names>
</name>
<etal/>
</person-group>. <article-title>The analysis of risk factors for diabetic nephropathy progression and the construction of a prognostic database for chronic kidney diseases</article-title>. <source>J Transl Med</source>. (<year>2019</year>) <volume>17</volume>:<fpage>264</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12967-019-2016-y</pub-id>
</citation>
</ref>
<ref id="B84">
<label>84</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Siddiqui</surname> <given-names>K</given-names>
</name>
<name>
<surname>George</surname> <given-names>TP</given-names>
</name>
<name>
<surname>Joy</surname> <given-names>SS</given-names>
</name>
<name>
<surname>Alfadda</surname> <given-names>AA</given-names>
</name>
</person-group>. <article-title>Risk factors of chronic kidney disease among type 2 diabetic patients with longer duration of diabetes</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2022</year>) <volume>13</volume>:<elocation-id>1079725</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fendo.2022.1079725</pub-id>
</citation>
</ref>
<ref id="B85">
<label>85</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jha</surname> <given-names>R</given-names>
</name>
<name>
<surname>Lopez-Trevino</surname> <given-names>S</given-names>
</name>
<name>
<surname>Kankanamalage</surname> <given-names>HR</given-names>
</name>
<name>
<surname>Jha</surname> <given-names>JC</given-names>
</name>
</person-group>. <article-title>Diabetes and renal complications: an overview on pathophysiology, biomarkers and therapeutic interventions</article-title>. <source>Biomedicines</source>. (<year>2024</year>) <volume>12</volume>:<fpage>1098</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/biomedicines12051098</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>