<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="methods-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Med.</journal-id>
<journal-title>Frontiers in Medicine</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Med.</abbrev-journal-title>
<issn pub-type="epub">2296-858X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmed.2025.1657889</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Medicine</subject>
<subj-group>
<subject>Methods</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Integrating convolutional neural networks with ensemble methods for enhanced diabetes diagnosis: a multi-dataset evaluation</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Zhuang</surname> <given-names>Kaibo</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Chenyang</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Chen</surname> <given-names>Zhen</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/3186481/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>She</surname> <given-names>Tianyu</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Wang</surname> <given-names>Min</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/3119470/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Department of Materials, University of Manchester</institution>, <addr-line>Manchester</addr-line>, <country>United Kingdom</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Oncology, The Second Affiliated Hospital of Chengdu Medical College, Nuclear Industry 416 Hospital</institution>, <addr-line>Chengdu</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>The Business School at CU Denver, Public University in Denver</institution>, <addr-line>Denver, CO</addr-line>, <country>United States</country></aff>
<aff id="aff4"><sup>4</sup><institution>Suzhou Medical College, Cancer Institute, Soochow University</institution>, <addr-line>Suzhou</addr-line>, <country>China</country></aff>
<aff id="aff5"><sup>5</sup><institution>Department of Medical Imaging Function, Xi&#x2019;an Electric Power Central Hospital</institution>, <addr-line>Xi&#x2019;an</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1640296/overview">Alwin Poulose</ext-link>, Indian Institute of Science Education and Research Thiruvananthapuram, India</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1009319/overview">Salvatore Corrao</ext-link>, University of Palermo, Italy</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1776486/overview">Ajay Kumar</ext-link>, University of Petroleum and Energy Studies, India</p></fn>
<corresp id="c001">&#x002A;Correspondence: Tianyu She, <email>2158956264@qq.com</email></corresp>
<corresp id="c002">Min Wang, <email>minwang202005@163.com</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>30</day>
<month>09</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>12</volume>
<elocation-id>1657889</elocation-id>
<history>
<date date-type="received">
<day>02</day>
<month>07</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>30</day>
<month>08</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2025 Zhuang, Zhang, Chen, She and Wang.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Zhuang, Zhang, Chen, She and Wang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Timely and accurate diagnosis of diabetes mellitus remains a pending challenge due to the diversity of patient data and the limitations of traditional screening methods.</p>
</sec>
<sec>
<title>Objective</title>
<p>To propose a hybrid prediction framework incorporating Convolutional Neural Networks (CNNs) and Integrated Learning with a soft voting strategy to improve the accuracy, robustness and interpretability of diabetes diagnosis.</p>
</sec>
<sec>
<title>Methods</title>
<p>The model was evaluated on two publicly available datasets&#x2014;the UCI Pima Indians Diabetes dataset (768 samples, 8 features), the same dataset used to describe the Pima Indians (2,000 samples, 8 features) and the Tianchi Medical dataset (5,642 samples, 41 features). After missing-value imputation, z-score standardization, and min&#x2013;max normalization, CNNs were used for deep feature extraction, followed by integration with multiple classifiers&#x2014;Logistic Regression (LR), Support Vector Machines (SVM), Random Forest, AdaBoost, XGBoost, LightGBM, and CatBoost&#x2014;via a weighted soft voting scheme. Training and testing sets were split 75:25, and hyperparameters for each classifier were tuned through grid search.</p>
</sec>
<sec>
<title>Results</title>
<p>The proposed CNN-Voting integrated model consistently outperforms the individual models, achieving up to 98% accuracy, 0.99 F1 value and 99% recall on the largest dataset. Feature importance analysis revealed that blood glucose, body mass index (BMI), age, and urea were the features with the most predictive value, which was highly consistent with common knowledge in clinical medicine.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>This hybrid model not only improves predictive performance and generalisability, but also provides a scalable and interpretable solution for clinical decision support in diabetes management.</p>
</sec>
</abstract>
<kwd-group>
<kwd>convolutional neural networks</kwd>
<kwd>diabetes</kwd>
<kwd>soft voting</kwd>
<kwd>machine learning</kwd>
<kwd>feature extraction</kwd>
</kwd-group>
<counts>
<fig-count count="5"/>
<table-count count="9"/>
<equation-count count="14"/>
<ref-count count="59"/>
<page-count count="16"/>
<word-count count="10672"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Precision Medicine</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="S1" sec-type="intro">
<title>1 Introduction</title>
<p>Diabetes Mellitus (DM) is a chronic metabolic disease characterized by hyperglycaemia (high blood sugar), primarily due to insufficient insulin secretion or insulin resistance (<xref ref-type="bibr" rid="B1">1</xref>). According to the International Diabetes Federation (IDF) in 2021, there were approximately 537 million people living with diabetes globally, which is expected to grow to 783 million by 2,045 (<xref ref-type="bibr" rid="B2">2</xref>). To make matters worse, complications caused by diabetes affect many vital organs, leading to irreversible damage such as blindness, kidney failure, cardiovascular disease, and neuropathy (<xref ref-type="bibr" rid="B3">3</xref>&#x2013;<xref ref-type="bibr" rid="B5">5</xref>). Globally, 450 million people are in the pre-diabetic stage of the disease, of which 70 per cent may develop diabetes in the future. However, about 50 per cent of patients with type 2 pre-diabetes can be prevented from developing diabetes through appropriate lifestyle interventions, exercise and dietary control (<xref ref-type="bibr" rid="B6">6</xref>). At the same time, diabetes is highly insidious, and there may be no obvious symptoms in the early stages. According to statistics, more than 50% of patients with type 2 diabetes have already demonstrated diabetic complications at the time of diagnosis. Current traditional screening methods for diabetes still have limitations such as relying on fasting blood glucose, OGTT or HbA1c, resulting in high testing costs, and some patients, even with normal blood glucose levels, may still go undiagnosed due to insulin resistance or other metabolic abnormalities (<xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B8">8</xref>). In recent years, machine learning has shown great potential in the field of medical prediction, aiming to help clinicians be able to make fast and accurate clinical predictions at an early stage, but the results of modeling using common machine learning models are not satisfactory. Deberneh and Kim developed a machine learning model to predict diabetes using a process consisting of ANOVA, Chi-Squared Test, and Recursive Feature Elimination (RFE) to select key features (<xref ref-type="bibr" rid="B9">9</xref>). Prediction performance was evaluated using traditional machine learning models and integrated learning for the 12 feature sets selected versus the traditional 5 feature sets (FPG, HbA1c, BMI, age, and gender), respectively, but the integrated learning approach outperformed the single model in cross-validation, with a limited improvement in overall accuracy of 73%. In Olisah et al.&#x2019;s study on predicting diabetes, a machine learning framework was proposed that used Spearman Correlation (SC) to select relevant features and Polynomial Regression (PR) to fill in missing values during the data preprocessing stage (<xref ref-type="bibr" rid="B10">10</xref>). They used Support Vector Machine (SVM), Random Forest (RF) and Twice-Growth Deep Neural Network (2GDNN) for prediction, and obtained a significant improvement in the performance of the model after SC and PR optimisation. The optimized 2GDNN achieved better accuracy than the traditional SVM. However, the feature selection method chosen by Olisah et al. has limitations although it improves the model performance to some extent. Firstly, Spearman correlation can only measure univariate relationships and cannot capture the interaction between features, which may lead to the omission of key variables.</p>
<p>In addition, one-hot encoding leads to data dimensionality inflation, which affects computational efficiency (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B12">12</xref>). In contrast, CNN can automatically extract deep features and avoid the limitation of manual feature selection, thus learning trends in patients&#x2019; conditions more comprehensively. Dinh et al. proposed a data-driven machine learning approach based on the prediction of diabetes and Cardiovascular Disease (CVD). They not only used traditional machine learning models SVM and LR, but also added RF, extreme Gradient Boosting (XGBoost), and Weighted Ensemble Model (WEM) in integrated learning to improve the prediction ability, and the results showed that XGBoost performed the best in the prediction (diabetes AUC = 95.7%, CVD AUC = 83.9%) (<xref ref-type="bibr" rid="B13">13</xref>). However, existing research approaches typically train machine learning models and deep learning models independently &#x201C;end-to-end&#x201D; and lack the fusion of the two, which may limit the generalization ability and robustness of the models. Therefore, we propose a hybrid model that combines multiple machine learning algorithms and convolutional neural networks (CNNs) with the aim of improving the performance of diabetes prediction. Our approach leverages the strengths of both traditional machine learning algorithms and deep learning techniques by integrating them to achieve more accurate predictions.</p>
<p>In this study, we propose an innovative hybrid modeling strategy. The model first uses a convolutional neural network (CNN) for deep extraction of data features to mine potential patterns associated with diabetes, which avoids human interference with feature weights. Subsequently, for the high-dimensional features extracted by the fully connected layer of the CNN, we weight the outputs by an integrated learning approach that combines multiple classical machine learning algorithms via a soft voting strategy. This fusion strategy of convolutional neural network to extract important features and soft-voting integration method for prediction effectively integrates and leverages the advantages of each model, improving the accuracy and robustness of prediction.</p>
</sec>
<sec id="S2">
<title>2 Datasets</title>
<sec id="S2.SS1">
<title>2.1 Source of the datasets</title>
<p>In our study, we evaluated the performance of different machine learning models and ensemble learning methods in a diabetes prediction task through a series of experiments. We selected three datasets with varying feature distributions and sample sizes to ensure the reliability and generalizability of the results. Datasets 1 and 2 are 769 data containing 8 features for Pima Indians from the University of California, Irvine (UCI) machine learning database and 2,000 data containing 8 features for Pima Indians, which is available at <ext-link ext-link-type="uri" xlink:href="https://archive.ics.uci.edu/">https://archive.ics.uci.edu/</ext-link>. This database is often used for benchmarking purposes in diabetes prediction studies due to its standardized format, however the two datasets differed in sample size, which allowed us to observe how model performance varied with increasing data size. Dataset 3 is derived from the preliminary dataset of &#x201C;Tianchi Precision Medicine Competition - Artificial Intelligence-assisted Diabetes Genetic Risk Prediction&#x201D; organized by Aliyun Tianchi Platform (<xref ref-type="table" rid="T1">Table 1</xref>). This dataset is designed to predict blood glucose concentration from the physical examination indicators of diabetic patients, and contains 5,642 data items, each of which has 41 features. The dataset covers a wide range of laboratory and physiological indicators associated with diabetes, enhancing clinical applicability and characterisation diversity.</p>
<table-wrap position="float" id="T1">
<label>TABLE 1</label>
<caption><p>Dataset summary.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="center">Dataset</td>
<td valign="top" align="center">Features</td>
<td valign="top" align="center">Total samples</td>
<td valign="top" align="center">Positive samples</td>
<td valign="top" align="center">Negative samples</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">1</td>
<td valign="top" align="center">8</td>
<td valign="top" align="center">769</td>
<td valign="top" align="center">269</td>
<td valign="top" align="center">500</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">8</td>
<td valign="top" align="center">2,000</td>
<td valign="top" align="center">1,316</td>
<td valign="top" align="center">684</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">41</td>
<td valign="top" align="center">5,642</td>
<td valign="top" align="center">2,832</td>
<td valign="top" align="center">2,792</td>
</tr>
</tbody>
</table></table-wrap>
<p>Together, these datasets are able to provide a comprehensive assessment for different sample sizes, feature complexity. However, there are some limitations. For example, datasets 1 and 2 contain only eight features, which may not adequately reflect the multidimensional nature of diabetes. In addition, these datasets may not be representative of broader ethnic or geographic diversity beyond the Pima Indian population. Dataset 3, although larger and richer, lacks detailed patient background and clinical context information, which may limit the interpretability of some features. Despite these limitations, the combination of these datasets provides a solid framework for evaluating the scalability and adaptability of the proposed hybrid model under varying data complexity.</p>
</sec>
<sec id="S2.SS2">
<title>2.2 Preprocessing</title>
<p>In this study, to improve the performance of the diabetes prediction model, we applied several data preprocessing techniques, including missing value imputation, feature normalization, and standardization. Given that certain features in the dataset contain missing values, we adopted mean imputation for numerical features, where missing entries were replaced with the mean of the corresponding feature. For categorical variables, the mode imputation method was used, substituting missing values with the most frequent category. The standardization process was conducted using <xref ref-type="disp-formula" rid="E1">Equation 1</xref>:</p>
<disp-formula id="E1">
<label>(1)</label>
<mml:math id="M1">
<mml:mrow>
<mml:mpadded width="+3.3pt">
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mtext>scaled</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mpadded>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mpadded width="+3.3pt">
<mml:mi>X</mml:mi>
</mml:mpadded>
<mml:mo rspace="5.8pt">-</mml:mo>
<mml:mrow>
<mml:mi>&#x03BC;</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>X</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x03C3;</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>X</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Each feature was transformed to have a mean of 0 and a standard deviation of 1 to eliminate the scale differences among features. Specifically, let <italic>X</italic> denote the original feature vector, &#x03BC;(<italic>X</italic>) its mean, and &#x03C3;(<italic>X</italic>) its standard deviation (<xref ref-type="bibr" rid="B14">14</xref>). This standardization step ensures that the data follows a standard normal distribution. Subsequently, the standardized data was normalized using <xref ref-type="disp-formula" rid="E2">Equation 2</xref>:</p>
<disp-formula id="E2">
<label>(2)</label>
<mml:math id="M2">
<mml:mrow>
<mml:mpadded width="+3.3pt">
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>c</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>a</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>l</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>e</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:msup>
<mml:mi>d</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
</mml:mrow>
</mml:msub>
</mml:mpadded>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>X</mml:mi>
<mml:mo>-</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>a</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>-</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>The aim is to scale the data to be in the interval [0,1], which helps in better training of some models that require input values in a specific range where <italic>X</italic><sub><italic>min</italic></sub> is the minimum value of the feature vector and <italic>X</italic><sub><italic>max</italic></sub> is the maximum value of the feature vector (<xref ref-type="bibr" rid="B15">15</xref>).</p>
<p>In this study, diabetes-related features were used as independent variables, and diabetes status (presence or absence of the disease) served as the dependent variable. The presence or absence of diabetes is coded using binary values where 0 represents non-diabetes and 1 represents having diabetes. In many machine learning tasks, class imbalance between positive and negative samples often leads to severe model overfitting and biased predictions. To address this issue, our study incorporated the Synthetic Minority Oversampling Technique (SMOTE), which generates synthetic samples for the minority class by interpolating between existing minority instances in feature space, thereby balancing the class distribution and improving model generalization (<xref ref-type="bibr" rid="B16">16</xref>). To train the dataset, the samples were divided into 75% training set over 25% testing set. As described earlier, traditional machine learning algorithms, ensemble methods, and hybrid CNN-based models were trained on the training set. The test set was then used to evaluate the performance of each model.</p>
</sec>
</sec>
<sec id="S3">
<title>3 Modeling and evaluation</title>
<p>In this study, we propose a hybrid model that combines multiple machine learning algorithms and convolutional neural networks (CNNs) with the aim of improving the performance of diabetes prediction. Our approach leverages the strengths of both traditional machine learning algorithms and deep learning techniques by integrating them to achieve more accurate predictions. The schematic diagram of the innovative model architecture is shown in <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Architecture flow of diabetes prediction model.</p></caption>
<alt-text>Flowchart illustrating a machine learning workflow. It begins with three datasets undergoing data pre-processing and segmentation into 75% training and 25% testing. The training data proceeds to feature extraction using convolutional layers, fully connected layers, and embedding. Both direct input and extracted features are fed into models: LR, SVM, RF, AdaBoost, XGBoost, LightGBM, CatBoost, and Voting. Each model outputs results. The process emphasizes model training and testing to generate final outputs.</alt-text>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-12-1657889-g001.tif"/>
</fig>
<sec id="S3.SS1">
<title>3.1 Traditional machine learning models</title>
<p>After data preprocessing, we employed several traditional machine learning algorithms for diabetes prediction, including logistic regression (LR), support vector machines (SVM), and decision trees (DT). These models were trained using standard classification procedures, including feature engineering and hyperparameter tuning. Logistic regression (LR) is one of the most common methods used for binary classification problems in healthcare prediction (<xref ref-type="bibr" rid="B17">17</xref>&#x2013;<xref ref-type="bibr" rid="B19">19</xref>). It predicts the probability that an instance belongs to a binary classification by linearly combining the input features (<xref ref-type="bibr" rid="B20">20</xref>), and this prediction is modeled as <xref ref-type="disp-formula" rid="E3">Equation 3</xref>:</p>
<disp-formula id="E3">
<label>(3)</label>
<mml:math id="M3">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mpadded width="+3.3pt">
<mml:mi>Y</mml:mi>
</mml:mpadded>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>|</mml:mo>
<mml:mi>X</mml:mi>
<mml:mo rspace="9.1pt">)</mml:mo>
</mml:mrow>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>+</mml:mo>
<mml:msup>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:mo>-</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mi>w</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where w denotes the feature weight coefficients and b is the bias term. Support vector machines are supervised learning algorithms for linear or nonlinear classification tasks in medical prediction, aiming at trying to find an optimal hyperplane that maximizes the interval between different classes (<xref ref-type="bibr" rid="B21">21</xref>&#x2013;<xref ref-type="bibr" rid="B24">24</xref>). Its decision function <xref ref-type="disp-formula" rid="E4">Equation 4</xref> is defined as:</p>
<disp-formula id="E4">
<label>(4)</label>
<mml:math id="M4">
<mml:mrow>
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo rspace="5.8pt">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>g</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>n</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mi>w</mml:mi>
<mml:mo>&#x22C5;</mml:mo>
<mml:mi>x</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where w is the normal vector of the hyperplane and b is the bias term. Decision tree is a versatile supervised learning algorithm for regression and classification tasks (<xref ref-type="bibr" rid="B25">25</xref>, <xref ref-type="bibr" rid="B26">26</xref>). It constructs a tree-like decision structure by dividing the training set, and it is also a basic component of the random forest algorithm (<xref ref-type="bibr" rid="B25">25</xref>). The feature selection criterion in its classification problem is based on the Gini index, the smaller the Gini index the better the classification effect, which is calculated by the <xref ref-type="disp-formula" rid="E5">Equation 5</xref>:</p>
<disp-formula id="E5">
<label>(5)</label>
<mml:math id="M5"><mml:mrow><mml:mi>G</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mi>i</mml:mi><mml:mtext>&#x2009;</mml:mtext><mml:mo stretchy='false'>(</mml:mo><mml:mi>D</mml:mi><mml:mo stretchy='false'>)</mml:mo><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>&#x2212;</mml:mo><mml:mstyle displaystyle='true'><mml:munderover><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>c</mml:mi></mml:munderover><mml:mrow><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mstyle></mml:mrow></mml:math>
</disp-formula>
<p>where p<sub><italic>i</italic></sub> represents the proportion of samples belonging to category, i.</p>
<p>In diabetes prediction modeling, feature screening is an important step to improve model performance, reduce complexity and enhance interpretability (<xref ref-type="bibr" rid="B27">27</xref>&#x2013;<xref ref-type="bibr" rid="B29">29</xref>). Feature screening helps to improve the prediction performance because not all features contribute equally to the prediction of diabetes. By removing features that contribute less to model performance, noise and redundant information can be reduced, allowing the model to focus more on the most informative features, thus improving prediction accuracy (<xref ref-type="bibr" rid="B30">30</xref>). In addition the model structure can be simplified and reduced in complexity by reducing unnecessary input variables, thereby reducing the risk of overfitting and improving the model&#x2019;s ability to generalize (<xref ref-type="bibr" rid="B31">31</xref>). Feature screening also enhances the interpretability of the model, helping researchers to understand the extent to which the model relies on different features to identify the biomarkers, physiological indicators, or risk factors that are most critical to diabetes development and risk assessment. Feature screening optimizes data collection and cost-effectiveness by reducing the cost and effort of data collection by screening the most representative features, making data collection more efficient and targeted. Therefore, we produced a correlation heat map and feature weighting table by calculating the Pearson correlation coefficient, which helps to assess whether there is feature redundancy or information loss in the model. Reasonable feature screening not only improves the performance of diabetes prediction models, but also enhances their clinical applicability, providing a more reliable basis for disease screening and personalized medicine.</p>
</sec>
<sec id="S3.SS2">
<title>3.2 Integrated learning methods</title>
<p>To improve prediction performance, we employed ensemble learning methods. Integrated learning is mainly based on two strategies, Bagging and Boosting, which can reduce the bias and variance of a single model by combining the prediction results of multiple base learners, thus improving the overall performance (<xref ref-type="bibr" rid="B32">32</xref>, <xref ref-type="bibr" rid="B33">33</xref>). Random Forest is an integrated learning method based on the Bagging strategy that uses multiple decision trees integrated for voting to accomplish the classification task (<xref ref-type="bibr" rid="B34">34</xref>). In addition, we also compare integrated learning methods based on Boosting such as AdaBoost, XGBoost, LightGBM, and CatBoost methods. AdaBoost iteratively trains weak learners, assigning higher weights to misclassified samples, so that the subsequent learners will pay more attention to misclassified samples and reclassify them, and the final model prediction XGBoost is based on the gradient boosting method, which optimizes the information of the second-order derivatives to complete the training of the model and improve the computational accuracy and efficiency. LightGBM is considered to be the optimized version of XGBoost, which adopts the leaf-wise growth strategy to speed up the computation and is more suitable for large datasets, and has a more accurate prediction of the category features. It has more accurate prediction of category features. CatBoost is an optimized gradient boosting algorithm tailored for categorical features, capable of automatically handling categorical variables, making it particularly suitable for tasks with a high proportion of such features (<xref ref-type="bibr" rid="B33">33</xref>, <xref ref-type="bibr" rid="B35">35</xref>&#x2013;<xref ref-type="bibr" rid="B37">37</xref>).</p>
<p>To integrate the prediction results of multiple models, this study adopted a soft voting ensemble learning method. In soft voting ensemble learning, the ensemble model generates the final category probability value by weighting the prediction probabilities of multiple base learners (<xref ref-type="bibr" rid="B38">38</xref>, <xref ref-type="bibr" rid="B39">39</xref>). The advantages of ensemble learning lie in the fact that different models perform differently under different data distributions, and soft voting can balance the performance of each model while fully leveraging their respective strengths.</p>
<p>Specifically, suppose there are M base learners <inline-formula><mml:math id="INEQ3"><mml:mrow><mml:msubsup><mml:mrow><mml:mo stretchy="false">{</mml:mo><mml:msub><mml:mi>f</mml:mi><mml:mi>m</mml:mi></mml:msub><mml:mo stretchy="false">}</mml:mo></mml:mrow><mml:mrow><mml:mpadded width="+6.6pt"><mml:mi>m</mml:mi></mml:mpadded><mml:mo>&#x2062;</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>M</mml:mi></mml:msubsup><mml:mo>,</mml:mo></mml:mrow></mml:math></inline-formula>and each base learner f<sub><italic>m</italic></sub> outputs the probability that a sample x belongs to the positive class (y = 1) as <inline-formula><mml:math id="INEQ4"><mml:mrow><mml:mover accent="true"><mml:msub><mml:mi>p</mml:mi><mml:mi>m</mml:mi></mml:msub><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mo>(</mml:mo><mml:mpadded width="+6.6pt"><mml:mi>y</mml:mi></mml:mpadded><mml:mn>1</mml:mn><mml:mo>|</mml:mo><mml:mi>x</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:math></inline-formula>. The weighted ensemble prediction can be expressed as the <xref ref-type="disp-formula" rid="E6">Equation 6</xref>:</p>
<disp-formula id="E6">
<label>(6)</label>
<mml:math id="M6"><mml:mrow><mml:mover accent='true'><mml:mi>p</mml:mi><mml:mo>&#x005E;</mml:mo></mml:mover><mml:mtext>&#x2009;</mml:mtext><mml:mo stretchy='false'>(</mml:mo><mml:mi>y</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy='false'>&#x007C;</mml:mo><mml:mi>x</mml:mi><mml:mo stretchy='false'>)</mml:mo><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle='true'><mml:msubsup><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mtext>&#x2009;</mml:mtext><mml:mo>=</mml:mo><mml:mtext>&#x2009;</mml:mtext><mml:mn>1</mml:mn></mml:mrow><mml:mi>M</mml:mi></mml:msubsup><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mi>m</mml:mi></mml:msub><mml:mover accent='true'><mml:mrow><mml:msub><mml:mi>p</mml:mi><mml:mi>m</mml:mi></mml:msub></mml:mrow><mml:mo stretchy='true'>&#x005E;</mml:mo></mml:mover><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mo>&#x007C;</mml:mo><mml:mi>y</mml:mi><mml:mtext>&#x2009;</mml:mtext><mml:mo>=</mml:mo><mml:mtext>&#x2009;</mml:mtext><mml:mn>1</mml:mn><mml:mo>&#x007C;</mml:mo><mml:mi>x</mml:mi></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:mrow><mml:mrow><mml:mstyle displaystyle='true'><mml:msubsup><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mtext>&#x2009;</mml:mtext><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>M</mml:mi></mml:msubsup><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mi>m</mml:mi></mml:msub></mml:mrow></mml:mstyle></mml:mrow></mml:mfrac></mml:mrow></mml:math></disp-formula>
<p>where <italic>w<sub>m</sub></italic> denotes the weight assigned to the m-th base learner, representing its relative importance in the ensemble model.</p>
<p>Secondly, by integrating multiple models, the method is able to reduce the dependence on a single model, which improves the generalization ability and reduces the risk of overfitting. In addition, by integrating the prediction results of multiple models, the soft voting method can improve the prediction accuracy and provide more reliable prediction results.</p>
<p>For the weight allocation of each base learner in soft voting integration, we choose to use an accuracy-based weighting method. The accuracy A<sub><italic>m</italic></sub> of each base learner f<sub><italic>m</italic></sub> is calculated on the validation set D<sub><italic>val</italic></sub>, as the <xref ref-type="disp-formula" rid="E7">Equation 7</xref>:</p>
<disp-formula id="E7">
<label>(7)</label>
<mml:math id="M7">
<mml:mrow>
<mml:mpadded width="+6.6pt">
<mml:msub>
<mml:mi>A</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mpadded>
<mml:mo>&#x2062;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mpadded width="+5pt">
<mml:mi>Number</mml:mi>
</mml:mpadded>
<mml:mo>&#x2062;</mml:mo>
<mml:mpadded width="+5pt">
<mml:mi>of</mml:mi>
</mml:mpadded>
<mml:mo>&#x2062;</mml:mo>
<mml:mpadded width="+5pt">
<mml:mi>correctly</mml:mi>
</mml:mpadded>
<mml:mo>&#x2062;</mml:mo>
<mml:mpadded width="+5pt">
<mml:mi>classified</mml:mi>
</mml:mpadded>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>samples</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mpadded width="+5pt">
<mml:mi>Total</mml:mi>
</mml:mpadded>
<mml:mo>&#x2062;</mml:mo>
<mml:mpadded width="+5pt">
<mml:mi>number</mml:mi>
</mml:mpadded>
<mml:mo>&#x2062;</mml:mo>
<mml:mpadded width="+5pt">
<mml:mi>of</mml:mi>
</mml:mpadded>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>samples</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Based on the accuracy of each base learner, the weight w is proportional to its accuracy A on the validation set. To ensure that the sum of all base learners&#x2019; weights equals 1, the weight terms are normalized, which is calculated by the <xref ref-type="disp-formula" rid="E8">Equation 8</xref>. This ensures that models with higher accuracy contribute more weight in the voting process, while those with lower accuracy contribute less weight.</p>
<disp-formula id="E8">
<label>(8)</label>
<mml:math id="M8"><mml:mtable><mml:mtr><mml:mtd><mml:msub><mml:mi>w</mml:mi><mml:mi>m</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>A</mml:mi><mml:mi>m</mml:mi></mml:msub></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:msub><mml:mi>w</mml:mi><mml:mi>m</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:msub><mml:mi>A</mml:mi><mml:mi>m</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:mstyle displaystyle='true'><mml:msubsup><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mtext>&#x2009;</mml:mtext><mml:mo>=</mml:mo><mml:mtext>&#x2009;</mml:mtext><mml:mn>1</mml:mn></mml:mrow><mml:mi>M</mml:mi></mml:msubsup><mml:mrow><mml:msub><mml:mi>A</mml:mi><mml:mi>m</mml:mi></mml:msub></mml:mrow></mml:mstyle></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>In this study, the use of soft-voting integrated learning can fully utilize the prediction ability of multiple models, thus improving the accuracy and robustness of diabetes prediction.</p>
</sec>
<sec id="S3.SS3">
<title>3.3 Convolutional neural network</title>
<p>To leverage the strengths of deep learning, we designed a Convolutional Neural Network (CNN) model for structural feature extraction. CNNs have demonstrated exceptional performance in image and sequential data processing due to their ability to capture both local and global patterns (<xref ref-type="bibr" rid="B40">40</xref>, <xref ref-type="bibr" rid="B41">41</xref>). In our study, the CNN architecture consists of convolutional layers that extract local structural features via convolution operations, pooling layers that reduce feature dimensionality while preserving salient information, and fully connected layers that project the learned features into the prediction space. The features extracted from the final CNN layer provides a rich, high-level feature representation, capable of capturing complex patterns that are often difficult for traditional machine learning algorithms to detect.</p>
<p>Specifically, the convolutional neural network (CNN) architecture consists of two convolutional layers (conv1 and conv2), two fully connected layers (fc1 and fc2), and an output layer (fc3). The rectified linear unit (ReLU) activation function is used in each layer to accelerate convergence and mitigate the vanishing gradient problem. After each convolutional layer and fully connected layer, the ReLU activation function is applied to the output to help the model learn more complex features. To ensure optimal model performance, several key hyperparameters were carefully tuned during training. The study used the adaptive learning rate optimiser Adam, with an initial learning rate set to 0.001. The Adam optimiser dynamically adjusts the learning rate based on each parameter&#x2019;s update, thereby accelerating the training process and improving stability. To mitigate overfitting, the Dropout technique was used in the CNN model to define the Dropout Rate. After the fully connected layers (fc1 and fc2), the Dropout Rate was set to 0.5. This strategy promotes network robustness by randomly &#x2018;dropping&#x2019; the outputs of some neurons. Additionally, we considered the impact of the number of filters. In the convolutional layers, we used 32 filters (conv1 layer) and 64 filters (conv2 layer). This configuration helps extract features of different scales from the input data. We used two fully connected layers (fc1 and fc2) in the CNN architecture to further process the high-dimensional features extracted by the convolutional layers. The role of these fully connected layers is to map the spatial features extracted by the CNN network to a higher-dimensional feature space, enabling the model to capture more complex patterns. The first fully connected layer, fc1, has an output size of 512 nodes, enabling further feature extraction. The second fully connected layer, fc2, has an output size of 256 nodes, providing a more compact and discriminative feature representation for the final classification task. Using two fully connected layers helps reduce the dimension of features and integrate the deep features extracted by the convolutional layers. This structure aims to enhance the network&#x2019;s ability to recognize complex patterns and provide more precise feature inputs for subsequent soft voting ensemble learning methods. Before performing soft voting ensemble learning, we first extracted deep features from the input data using a CNN, then further processed them through two fully connected layers. Finally, a weighted soft voting strategy was adopted to combine the outputs of multiple classifiers (such as Logistic Regression, SVM, XGBoost, Random Forest, etc.) to obtain the final prediction result. During soft voting, the weights of the models are allocated based on their accuracy on the validation set. Specifically, the output probabilities of each model are weighted averaged to obtain the final classification probability, and the category with the highest probability is selected as the model&#x2019;s prediction result.</p>
</sec>
<sec id="S3.SS4">
<title>3.4 Hybrid model design</title>
<p>To further improve predictive performance, we integrated the features extracted by the CNN with those used in ensemble learning models. This hybrid architecture is referred to as the hybrid CNN-based models. CNN-based models High-level features were first extracted from the dataset using the CNN, and then fused either by concatenation or weighted combination with features derived from conventional machine learning models. The ensemble learning model was then trained on the fused feature set to generate diabetes prediction results. In addition, the fused features were visualized for interpretability.</p>
<p>The key advantage of this hybrid approach lies in the CNN&#x2019;s capability to capture complex and non-linear patterns in the data, thereby complementing the limitations of traditional machine learning methods. As a result, the hybrid model achieves enhanced predictive accuracy, robustness, and generalization performance.</p>
</sec>
<sec id="S3.SS5">
<title>3.5 Evaluation metrics</title>
<p>In machine learning, model performance evaluation is critical. Common evaluation metrics include Accuracy, Recall, F1-score, and the Receiver Operating Characteristic (ROC) curve, which are particularly useful in binary classification tasks (<xref ref-type="bibr" rid="B42">42</xref>).</p>
<p>Accuracy measures the proportion of correctly predicted instances over the total number of samples and is calculated as shown in <xref ref-type="disp-formula" rid="E9">Equation 9</xref>:</p>
<disp-formula id="E9">
<label>(9)</label>
<mml:math id="M9">
<mml:mrow>
<mml:mpadded width="+3.3pt">
<mml:mtext>Accuracy</mml:mtext>
</mml:mpadded>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Where TP (True Positive) refers to the number of positive samples correctly predicted as positive, TN (True Negative) refers to the number of negative samples correctly predicted as negative, FP (False Positive) refers to the number of negative samples incorrectly predicted as positive, and FN (False Negative) refers to the number of positive samples incorrectly predicted as negative.</p>
<p>Recall (also known as Sensitivity or True Positive Rate) measures the proportion of actual positive cases that are correctly identified by the model. It is calculated as shown in <xref ref-type="disp-formula" rid="E10">Equation 10</xref>:</p>
<disp-formula id="E10">
<label>(10)</label>
<mml:math id="M10">
<mml:mrow>
<mml:mpadded width="+3.3pt">
<mml:mtext>Recall</mml:mtext>
</mml:mpadded>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>The F1-score is the harmonic mean of Precision and Recall, and it is used to balance the two metrics. When dealing with imbalanced datasets, the F1-score is considered more reliable than Accuracy, as it takes into account both False Positives (FP) and False Negatives (FN). It is computed as shown in <xref ref-type="disp-formula" rid="E11">Equation 11</xref>:</p>
<disp-formula id="E11">
<label>(11)</label>
<mml:math id="M11">
<mml:mrow>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mpadded width="+3.3pt">
<mml:mn>1</mml:mn>
</mml:mpadded>
</mml:mrow>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mrow>
<mml:mpadded width="+3.3pt">
<mml:mn>2</mml:mn>
</mml:mpadded>
<mml:mo rspace="5.8pt">&#x00D7;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mpadded width="+3.3pt">
<mml:mtext>Precision</mml:mtext>
</mml:mpadded>
<mml:mo rspace="5.8pt">&#x00D7;&#x00A0;</mml:mo>
<mml:mtext>Recall</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>Precision</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>Recall</mml:mtext>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In addition, we also evaluated the stability and statistical reliability of the model results based on accuracy, specificity, and the Matthews Correlation Coefficient (MCC) at a 95% confidence interval.</p>
<p>Precision refers to the proportion of all samples predicted by the model to be in the positive category that are actually in the positive category. <xref ref-type="disp-formula" rid="E12">Equation 12</xref> is calculated as follows:</p>
<disp-formula id="E12">
<label>(12)</label>
<mml:math id="M12">
<mml:mrow>
<mml:mpadded width="+3.3pt">
<mml:mtext>Precision</mml:mtext>
</mml:mpadded>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Specificity, also known as the true negative rate (TNR), measures the proportion of correctly predicted negative cases among all actual negative cases. It is computed as shown in <xref ref-type="disp-formula" rid="E13">Equation 13</xref>:</p>
<disp-formula id="E13">
<label>(13)</label>
<mml:math id="M13">
<mml:mrow>
<mml:mpadded width="+3.3pt">
<mml:mtext>Specificity</mml:mtext>
</mml:mpadded>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>The Matthews Correlation Coefficient (MCC) is a balanced metric that measures the quality of binary classifications. MCC returns a value between &#x2212;1 and +1, where +1 indicates perfect prediction, 0 indicates random prediction, and &#x2212;1 indicates complete disagreement between prediction and observation (<xref ref-type="bibr" rid="B43">43</xref>, <xref ref-type="bibr" rid="B44">44</xref>). It is calculated as shown in <xref ref-type="disp-formula" rid="E14">Equation 14</xref>:</p>
<disp-formula id="E14">
<label>(14)</label>
<mml:math id="M14">
<mml:mrow>
<mml:mpadded width="+3.3pt">
<mml:mtext>MCC</mml:mtext>
</mml:mpadded>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mpadded width="+3.3pt">
<mml:mi>P</mml:mi>
</mml:mpadded>
</mml:mrow>
<mml:mo rspace="5.8pt">&#x00D7;</mml:mo>
<mml:mi>T</mml:mi>
</mml:mrow>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mo>-</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mpadded width="+3.3pt">
<mml:mi>P</mml:mi>
</mml:mpadded>
</mml:mrow>
<mml:mo rspace="5.8pt">&#x00D7;</mml:mo>
<mml:mi>F</mml:mi>
</mml:mrow>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mrow>
<mml:msqrt>
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msqrt>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
</sec>
</sec>
<sec id="S4">
<title>4 Results and discussion</title>
<sec id="S4.SS1">
<title>4.1. Performance comparison of models</title>
<p>To comprehensively evaluate the predictive capabilities of different algorithms, we compared various classical machine learning (ML) models, ensemble methods, and the deep learning-based hybrid model. The performance was assessed using four key metrics: Accuracy, Area Under the ROC Curve (AUC), F1-score, and Recall (<xref ref-type="table" rid="T2">Tables 2</xref>&#x2013;<xref ref-type="table" rid="T4">4</xref>). To provide a clearer visualization of model performance, the results were also illustrated using a horizontal stacked bar chart (<xref ref-type="fig" rid="F2">Figure 2</xref>).</p>
<table-wrap position="float" id="T2">
<label>TABLE 2</label>
<caption><p>Performance results of Dataset 1.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="center">Category</td>
<td valign="top" align="center">Model</td>
<td valign="top" align="center">Accuracy</td>
<td valign="top" align="center">AUC</td>
<td valign="top" align="center">F1 score</td>
<td valign="top" align="center">Recall</td>
<td valign="top" align="center">Precision</td>
<td valign="top" align="center">Specificity</td>
<td valign="top" align="center">MCC</td>
<td valign="top" align="center">CI (95%)</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center" rowspan="7">Classical ML</td>
<td valign="top" align="center">LR</td>
<td valign="top" align="center">0.68</td>
<td valign="top" align="center">0.77</td>
<td valign="top" align="center">0.5</td>
<td valign="top" align="center">0.52</td>
<td valign="top" align="center">0.50</td>
<td valign="top" align="center">0.52</td>
<td valign="top" align="center">0.38</td>
<td valign="top" align="center">[0.63, 0.73]</td>
</tr>
<tr>
<td valign="top" align="center">SVM</td>
<td valign="top" align="center">0.67</td>
<td valign="top" align="center">0.72</td>
<td valign="top" align="center">0.58</td>
<td valign="top" align="center">0.6</td>
<td valign="top" align="center">0.58</td>
<td valign="top" align="center">0.60</td>
<td valign="top" align="center">0.33</td>
<td valign="top" align="center">[0.61, 0.72]</td>
</tr>
<tr>
<td valign="top" align="center">Random forest</td>
<td valign="top" align="center">0.66</td>
<td valign="top" align="center">0.74</td>
<td valign="top" align="center">0.53</td>
<td valign="top" align="center">0.54</td>
<td valign="top" align="center">0.53</td>
<td valign="top" align="center">0.54</td>
<td valign="top" align="center">0.30</td>
<td valign="top" align="center">[0.60, 0.71]</td>
</tr>
<tr>
<td valign="top" align="center">AdaBoost</td>
<td valign="top" align="center">0.72</td>
<td valign="top" align="center">0.76</td>
<td valign="top" align="center">0.66</td>
<td valign="top" align="center">0.69</td>
<td valign="top" align="center">0.66</td>
<td valign="top" align="center">0.69</td>
<td valign="top" align="center">0.42</td>
<td valign="top" align="center">[0.65, 0.75]</td>
</tr>
<tr>
<td valign="top" align="center">XGBoost</td>
<td valign="top" align="center">0.71</td>
<td valign="top" align="center">0.78</td>
<td valign="top" align="center">0.65</td>
<td valign="top" align="center">0.65</td>
<td valign="top" align="center">0.65</td>
<td valign="top" align="center">0.65</td>
<td valign="top" align="center">0.38</td>
<td valign="top" align="center">[0.63, 0.73]</td>
</tr>
<tr>
<td valign="top" align="center">LightGBM</td>
<td valign="top" align="center">0.73</td>
<td valign="top" align="center">0.77</td>
<td valign="top" align="center">0.66</td>
<td valign="top" align="center">0.64</td>
<td valign="top" align="center">0.66</td>
<td valign="top" align="center">0.64</td>
<td valign="top" align="center">0.40</td>
<td valign="top" align="center">[0.64, 0.74]</td>
</tr>
<tr>
<td valign="top" align="center">CatBoost</td>
<td valign="top" align="center">0.69</td>
<td valign="top" align="center">0.79</td>
<td valign="top" align="center">0.6</td>
<td valign="top" align="center">0.62</td>
<td valign="top" align="center">0.60</td>
<td valign="top" align="center">0.62</td>
<td valign="top" align="center">0.35</td>
<td valign="top" align="center">[0.60, 0.73]</td>
</tr>
<tr>
<td valign="top" align="center">Ensemble</td>
<td valign="top" align="center">Voting ensemble</td>
<td valign="top" align="center">0.75</td>
<td valign="top" align="center">0.8</td>
<td valign="top" align="center">0.68</td>
<td valign="top" align="center">0.68</td>
<td valign="top" align="center">0.68</td>
<td valign="top" align="center">0.68</td>
<td valign="top" align="center">0.50</td>
<td valign="top" align="center">[0.68, 0.77]</td>
</tr>
<tr>
<td valign="top" align="center">CNN+Ensemble</td>
<td valign="top" align="center">CNN-voting ensemble</td>
<td valign="top" align="center">0.75</td>
<td valign="top" align="center">0.85</td>
<td valign="top" align="center">0.75</td>
<td valign="top" align="center">0.72</td>
<td valign="top" align="center">0.68</td>
<td valign="top" align="center">0.72</td>
<td valign="top" align="center">0.56</td>
<td valign="top" align="center">[0.73, 0.82]</td>
</tr>
</tbody>
</table></table-wrap>
<table-wrap position="float" id="T3">
<label>TABLE 3</label>
<caption><p>Performance results of Dataset 2.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="center">Category</td>
<td valign="top" align="center">Model</td>
<td valign="top" align="center">Accuracy</td>
<td valign="top" align="center">AUC</td>
<td valign="top" align="center">F1 score</td>
<td valign="top" align="center">Recall</td>
<td valign="top" align="center">Precision</td>
<td valign="top" align="center">Specificity</td>
<td valign="top" align="center">MCC</td>
<td valign="top" align="center">CI (95%)</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center" rowspan="7">Classical ML</td>
<td valign="top" align="center">LR</td>
<td valign="top" align="center">0.68</td>
<td valign="top" align="center">0.76</td>
<td valign="top" align="center">0.61</td>
<td valign="top" align="center">0.59</td>
<td valign="top" align="center">0.62</td>
<td valign="top" align="center">0.85</td>
<td valign="top" align="center">0.39</td>
<td valign="top" align="center">[0.62, 0.73]</td>
</tr>
<tr>
<td valign="top" align="center">SVM</td>
<td valign="top" align="center">0.74</td>
<td valign="top" align="center">0.77</td>
<td valign="top" align="center">0.53</td>
<td valign="top" align="center">0.45</td>
<td valign="top" align="center">0.60</td>
<td valign="top" align="center">0.78</td>
<td valign="top" align="center">0.31</td>
<td valign="top" align="center">[0.64, 0.74]</td>
</tr>
<tr>
<td valign="top" align="center">Random forest</td>
<td valign="top" align="center">0.75</td>
<td valign="top" align="center">0.79</td>
<td valign="top" align="center">0.55</td>
<td valign="top" align="center">0.48</td>
<td valign="top" align="center">0.61</td>
<td valign="top" align="center">0.80</td>
<td valign="top" align="center">0.33</td>
<td valign="top" align="center">[0.66, 0.75]</td>
</tr>
<tr>
<td valign="top" align="center">AdaBoost</td>
<td valign="top" align="center">0.7</td>
<td valign="top" align="center">0.75</td>
<td valign="top" align="center">0.51</td>
<td valign="top" align="center">0.52</td>
<td valign="top" align="center">0.59</td>
<td valign="top" align="center">0.79</td>
<td valign="top" align="center">0.29</td>
<td valign="top" align="center">[0.62, 0.74]</td>
</tr>
<tr>
<td valign="top" align="center">XGBoost</td>
<td valign="top" align="center">0.71</td>
<td valign="top" align="center">0.74</td>
<td valign="top" align="center">0.53</td>
<td valign="top" align="center">0.54</td>
<td valign="top" align="center">0.60</td>
<td valign="top" align="center">0.76</td>
<td valign="top" align="center">0.32</td>
<td valign="top" align="center">[0.63, 0.72]</td>
</tr>
<tr>
<td valign="top" align="center">LightGBM</td>
<td valign="top" align="center">0.73</td>
<td valign="top" align="center">0.76</td>
<td valign="top" align="center">0.55</td>
<td valign="top" align="center">0.56</td>
<td valign="top" align="center">0.62</td>
<td valign="top" align="center">0.79</td>
<td valign="top" align="center">0.34</td>
<td valign="top" align="center">[0.64, 0.74]</td>
</tr>
<tr>
<td valign="top" align="center">CatBoost</td>
<td valign="top" align="center">0.78</td>
<td valign="top" align="center">0.81</td>
<td valign="top" align="center">0.58</td>
<td valign="top" align="center">0.51</td>
<td valign="top" align="center">0.63</td>
<td valign="top" align="center">0.83</td>
<td valign="top" align="center">0.42</td>
<td valign="top" align="center">[0.67, 0.77]</td>
</tr>
<tr>
<td valign="top" align="center">Ensemble</td>
<td valign="top" align="center">Voting ensemble</td>
<td valign="top" align="center">0.72</td>
<td valign="top" align="center">0.78</td>
<td valign="top" align="center">0.52</td>
<td valign="top" align="center">0.47</td>
<td valign="top" align="center">0.54</td>
<td valign="top" align="center">0.76</td>
<td valign="top" align="center">0.28</td>
<td valign="top" align="center">[0.61, 0.73]</td>
</tr>
<tr>
<td valign="top" align="center">CNN+Ensemble</td>
<td valign="top" align="center">CNN-voting ensemble</td>
<td valign="top" align="center">0.83</td>
<td valign="top" align="center">0.93</td>
<td valign="top" align="center">0.82</td>
<td valign="top" align="center">0.81</td>
<td valign="top" align="center">0.96</td>
<td valign="top" align="center">0.90</td>
<td valign="top" align="center">0.66</td>
<td valign="top" align="center">[0.80, 0.88]</td>
</tr>
</tbody>
</table></table-wrap>
<table-wrap position="float" id="T4">
<label>TABLE 4</label>
<caption><p>Performance results of Dataset 3.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="center">Category</td>
<td valign="top" align="center">Model</td>
<td valign="top" align="center">Accuracy</td>
<td valign="top" align="center">AUC</td>
<td valign="top" align="center">F1 score</td>
<td valign="top" align="center">Recall</td>
<td valign="top" align="center">Precision</td>
<td valign="top" align="center">Specificity</td>
<td valign="top" align="center">MCC</td>
<td valign="top" align="center">CI (95%)</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center" rowspan="7">Classical ML</td>
<td valign="top" align="center">LR</td>
<td valign="top" align="center">0.7</td>
<td valign="top" align="center">0.78</td>
<td valign="top" align="center">0.5</td>
<td valign="top" align="center">0.53</td>
<td valign="top" align="center">0.56</td>
<td valign="top" align="center">0.86</td>
<td valign="top" align="center">0.34</td>
<td valign="top" align="center">[0.63, 0.74]</td>
</tr>
<tr>
<td valign="top" align="center">SVM</td>
<td valign="top" align="center">0.85</td>
<td valign="top" align="center">0.86</td>
<td valign="top" align="center">0.74</td>
<td valign="top" align="center">0.71</td>
<td valign="top" align="center">0.76</td>
<td valign="top" align="center">0.84</td>
<td valign="top" align="center">0.60</td>
<td valign="top" align="center">[0.75, 0.89]</td>
</tr>
<tr>
<td valign="top" align="center">Random forest</td>
<td valign="top" align="center">0.95</td>
<td valign="top" align="center">0.98</td>
<td valign="top" align="center">0.92</td>
<td valign="top" align="center">0.93</td>
<td valign="top" align="center">0.94</td>
<td valign="top" align="center">0.97</td>
<td valign="top" align="center">0.84</td>
<td valign="top" align="center">[0.92, 0.97]</td>
</tr>
<tr>
<td valign="top" align="center">AdaBoost</td>
<td valign="top" align="center">0.82</td>
<td valign="top" align="center">0.88</td>
<td valign="top" align="center">0.71</td>
<td valign="top" align="center">0.68</td>
<td valign="top" align="center">0.72</td>
<td valign="top" align="center">0.85</td>
<td valign="top" align="center">0.45</td>
<td valign="top" align="center">[0.74, 0.84]</td>
</tr>
<tr>
<td valign="top" align="center">XGBoost</td>
<td valign="top" align="center">0.94</td>
<td valign="top" align="center">0.97</td>
<td valign="top" align="center">0.91</td>
<td valign="top" align="center">0.9</td>
<td valign="top" align="center">0.92</td>
<td valign="top" align="center">0.95</td>
<td valign="top" align="center">0.74</td>
<td valign="top" align="center">[0.88, 0.96]</td>
</tr>
<tr>
<td valign="top" align="center">LightGBM</td>
<td valign="top" align="center">0.96</td>
<td valign="top" align="center">0.97</td>
<td valign="top" align="center">0.94</td>
<td valign="top" align="center">0.93</td>
<td valign="top" align="center">0.95</td>
<td valign="top" align="center">0.97</td>
<td valign="top" align="center">0.79</td>
<td valign="top" align="center">[0.92, 0.98]</td>
</tr>
<tr>
<td valign="top" align="center">CatBoost</td>
<td valign="top" align="center">0.93</td>
<td valign="top" align="center">0.95</td>
<td valign="top" align="center">0.89</td>
<td valign="top" align="center">0.85</td>
<td valign="top" align="center">0.91</td>
<td valign="top" align="center">0.94</td>
<td valign="top" align="center">0.72</td>
<td valign="top" align="center">[0.87, 0.95]</td>
</tr>
<tr>
<td valign="top" align="center">Ensemble</td>
<td valign="top" align="center">Voting ensemble</td>
<td valign="top" align="center">0.96</td>
<td valign="top" align="center">0.97</td>
<td valign="top" align="center">0.93</td>
<td valign="top" align="center">0.94</td>
<td valign="top" align="center">0.94</td>
<td valign="top" align="center">0.98</td>
<td valign="top" align="center">0.82</td>
<td valign="top" align="center">[0.93, 0.98]</td>
</tr>
<tr>
<td valign="top" align="center">CNN+Ensemble</td>
<td valign="top" align="center">CNN-voting ensemble</td>
<td valign="top" align="center">0.97</td>
<td valign="top" align="center">0.98</td>
<td valign="top" align="center">0.98</td>
<td valign="top" align="center">0.99</td>
<td valign="top" align="center">0.97</td>
<td valign="top" align="center">0.99</td>
<td valign="top" align="center">0.94</td>
<td valign="top" align="center">[0.97, 0.99]</td>
</tr>
</tbody>
</table></table-wrap>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Horizontal stacked bar charts illustrating performance comparison across different datasets <bold>(A)</bold> results on the UCI Pima Indian Diabetes dataset (Dataset 1); <bold>(B)</bold> results on the expanded UCI Pima dataset with increased samples (Dataset 2); <bold>(C)</bold> results on the Tianchi AI-assisted diabetes prediction dataset with 41 features (Dataset 3).</p></caption>
<alt-text>Bar charts labeled A, B, and C compare the performance of various machine learning models using four metrics: ACC, AUC, F1 Score, and Recall. Models include CNN-Voting Ensemble, Voting Ensemble, CatBoost, LightGBM, XGBoost, AdaBoost, Random Forest, SVM, and LR. Each chart displays colored bars representing the metrics, with CNN-Voting Ensemble consistently leading across charts. The metrics are differentiated by shades of blue and green.</alt-text>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-12-1657889-g002.tif"/>
</fig>
<p>On Dataset 1, the classical machine learning models achieved moderate performance. Among them, LightGBM performed relatively well, with an accuracy of 0.73 and an F1-score of 0.66. This indicates that LightGBM was able to effectively capture complex patterns within the dataset for the diabetes prediction task. The relatively high F1-score, compared to other traditional ML models, highlights its strength in managing feature complexity and class imbalance. However, despite its strong modeling capability, LightGBM still remained inferior to ensemble and deep learning-based approaches.</p>
<p>In contrast, the hybrid model exhibited significantly better performance on the same dataset. The CNN-Voting Ensemble model outperformed all others across evaluation metrics, achieving an accuracy of 0.78, an AUC of 0.85, an F1-score of 0.75, and a recall of 0.72. These results demonstrate that combining deep learning with traditional machine learning techniques can significantly enhance predictive capabilities, particularly for tasks such as diabetes prediction. The CNN architecture effectively extracts high-dimensional features, which is crucial for capturing non-linear relationships and complex data patterns.</p>
<p>Furthermore, the CNN-Voting Ensemble model clearly outperformed individual traditional ML models, indicating that multi-model integration can harness the strengths of each base learner, thereby improving prediction stability and generalization capability. The CNN&#x2019;s ability to learn complex representations makes it especially effective in supporting more accurate diagnoses for complex diseases such as diabetes.</p>
<p>On Dataset 2, the advantages of the hybrid model became even more pronounced. As shown in <xref ref-type="table" rid="T2">Table 2</xref>, the CNN-Voting Ensemble again achieved the best performance, with an accuracy of 0.85, an AUC of 0.93, an F1-score of 0.82, and a recall of 0.81. In comparison, traditional models struggled to reach similar performance, particularly in terms of F1-score and recall. For example, the SVM model only achieved an F1-score of 0.53 and a recall of 0.59, suggesting its limited ability to extract informative features under class-imbalanced conditions. Other models such as Random Forest and XGBoost also exhibited constraints in feature extraction and classification. This performance gap further validates the effectiveness of integrating deep learning with traditional ML methods when dealing with high-dimensional and complex features. The use of high-level features extracted by the CNN significantly boosted the performance of the ensemble model, especially in terms of AUC and recall, demonstrating greater robustness and generalization ability. These results also underscore the limitations of classical ML models in handling high dimensionality and class imbalance, which can be effectively mitigated through deep learning approaches.</p>
<p>On Dataset 3, all models showed significant performance improvements. The CNN-Voting Ensemble achieved outstanding results, with an accuracy of 0.98, an AUC of 0.98, and both F1-score and recall reaching 0.99, indicating its strong capability in handling high-dimensional and complex medical data with high stability and reliability.</p>
<p>On this dataset, classical machine learning models also demonstrated improved performance, particularly LightGBM and CatBoost, which both reached an accuracy of around 0.97. However, their F1-scores and recall values were notably lower than those of the hybrid model, indicating continued sensitivity to class imbalance. In the context of diabetes prediction, accuracy alone is insufficient; it is critical for models to maintain a high recall and F1-score under imbalanced conditions, as these metrics are more relevant for real-world applications. The CNN-Voting Ensemble outperformed all other models across all core metrics, with accuracy, AUC, F1-score, and recall all ranging between 0.98 and 0.99, underscores its superior predictive capacity. In contrast, although traditional models provided reasonable accuracy, they tended to favor the majority class when faced with imbalanced data, resulting in reduced F1-score and recall. This once again confirms the effectiveness of hybrid deep learning and machine learning approaches for diabetes prediction, especially in addressing class imbalance and feature complexity.</p>
<p>Across the three datasets, experimental results consistently demonstrated that while classical ML models can serve as reasonable baselines, their performance is often constrained by limited feature extraction capabilities. Models such as SVM, Random Forest, and XGBoost, although capable of achieving good accuracy on certain datasets, exhibited notable limitations in handling high-dimensional features and class imbalance, leading to suboptimal F1-scores and recall.</p>
<p>To address the limitations of conventional evaluation metrics and to provide a more comprehensive assessment, additional clinically relevant indicators&#x2014;Precision, Specificity, and Matthews Correlation Coefficient (MCC) with their corresponding 95% confidence intervals&#x2014;were included. Across all three datasets, the proposed CNN-Voting Ensemble consistently outperformed other models, achieving the highest MCC values of 0.56 (95% CI: [0.73, 0.82]), 0.66 (95% CI: [0.80, 0.88]), and 0.94 (95% CI: [0.97, 0.99]) for Dataset1, Dataset2, and Dataset3, respectively. Notably, it also exhibited superior Precision (0.95&#x2013;0.99) and Specificity (0.90&#x2013;0.99), underscoring its ability to maintain both high positive predictive accuracy and a low false-positive rate. Classical machine learning models, such as Random Forest, LightGBM, and XGBoost, demonstrated competitive performance in Dataset3 (MCC &#x2265; 0.74) but were less effective in Dataset1 and Dataset2, particularly in terms of MCC and Precision. Ensemble approaches, including Voting Ensemble, showed moderate improvement over individual models but did not surpass the hybrid CNN-Voting Ensemble in any dataset. These results highlight the importance of incorporating MCC, Precision, and Specificity&#x2014;metrics that are particularly valuable in medical diagnosis where class imbalance and misclassification costs are critical. The consistent superiority of the CNN-Voting Ensemble across multiple datasets suggests its robustness and potential applicability in clinical decision-support systems.</p>
<p>The soft voting ensemble approach significantly improved stability and generalization by combining the strengths of multiple base learners. Ensemble methods like the Voting Ensemble can integrate the predictive power of diverse models, effectively compensating for individual weaknesses in feature representation. As a result, they achieved consistent performance across all datasets. However, it is important to note that while ensemble models exhibited robust performance, they did not match the level achieved by hybrid models that incorporated deep learning.</p>
<p>The most significant performance improvement was achieved by the hybrid CNN-based models. This strategy combines the CNN&#x2019;s superior feature extraction ability with the strong learning capacity of traditional models, resulting in the best performance across all evaluation metrics, especially in terms of F1-score and recall. This is particularly beneficial in diabetes prediction tasks, where imbalanced class distributions are common and accurate identification of minority class instances is crucial. In addition, we conducted a comparative analysis between our proposed model and the Transformer architecture, a state-of-the-art deep learning framework specifically designed for advanced tabular data modeling in medical applications. As presented in <xref ref-type="supplementary-material" rid="DS1">Supplementary Appendix A</xref>, our model consistently outperforms the Transformer in terms of predictive accuracy, robustness, and generalizability across multiple datasets, thereby underscoring its superior capability in capturing complex feature interactions and delivering reliable diagnostic performance. The hybrid model thus offers a highly effective solution for real-world medical prediction tasks that demand both accuracy and robustness.</p>
</sec>
<sec id="S4.SS2">
<title>4.2 Confusion matrix analysis</title>
<p><xref ref-type="fig" rid="F3">Figure 3</xref> presents the confusion matrices of the proposed model evaluated on three independent datasets (Dataset 1, Dataset 2, and Dataset 3). The confusion matrix comprises four key components: True Positives (TP), False Positives (FP), True Negatives (TN), and False Negatives (FN). These metrics comprehensively provide a comprehensive assessment under varying data distributions and offer valuable insights into its behavior in realistic clinical diagnostic contexts.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>Confusion matrix visualizations for three datasets <bold>(A)</bold> confusion matrix of the UCI Pima Indian dataset (Dataset 1); <bold>(B)</bold> confusion matrix of the expanded UCI dataset (Dataset 2); <bold>(C)</bold> confusion matrix of the Tianchi AI-assisted diabetes prediction dataset (Dataset 3).</p></caption>
<alt-text>Three confusion matrices labeled A, B, and C compare predicted vs. actual values. Matrix A shows 194 true positives, 75 false negatives, 94 false positives, and 407 true negatives. Matrix B displays 1066 true positives, 250 false negatives, 50 false positives, and 634 true negatives. Matrix C indicates 2804 true positives, 28 false negatives, 84 false positives, and 2708 true negatives. A color scale on the right ranges from light to dark blue, representing lower to higher values.</alt-text>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-12-1657889-g003.tif"/>
</fig>
<p>As shown in <xref ref-type="fig" rid="F3">Figure 3A</xref>, the model demonstrated stable performance on Dataset 1. Specifically, it achieved true positives (TP) was 194, true negatives (TN) was 407, false positives (FP) was 94, and false negatives (FN) was 75. On this dataset, the model achieved an accuracy of 74.3%, precision of 67.4%, and recall of 72.1%. These metrics suggest that the model was able to effectively distinguish between positive and negative samples. However, the relatively high number of false positives (94 cases) indicates a tendency toward over-prediction of the positive class, may be attributed to the limited size and feature richness of the dataset. Nevertheless, the model maintained a balanced classification performance overall, with reliable identification of both positive and negative cases, demonstrating strong general capabilities in both disease detection and exclusion.</p>
<p>In comparison, the model&#x2019;s performance on Dataset 2 exhibited marked improvements, particularly in terms of classification accuracy and precision. As shown in <xref ref-type="fig" rid="F3">Figure 3B</xref>, the model achieved a significantly higher number of true positives (TP = 1,066) and true negatives (TN = 634), while false positives (FP) were substantially reduced to 50, and false negatives (FN) totaled 250. The resulting accuracy was 83.1%, with a precision of 95.5% and a recall of 81.0%. These results demonstrate that with increased dataset size and complexity, the model&#x2019;s precision in classification tasks improved considerably. The substantial reduction in false positives is especially noteworthy, reflecting improved discrimination between diabetic and non-diabetic cases. In clinical practice, high precision and recall are vital to minimizing both false alarms and missed diagnoses, and the results from Dataset 2 affirm the model&#x2019;s suitability for medium-scale diagnostic applications.</p>
<p>Performance on Dataset 3 was particularly strong. As depicted in <xref ref-type="fig" rid="F3">Figure 3C</xref>, the model attained 2,804 true positives and 2,708 true negatives, with only 84 false positives and 28 false negatives. These outcomes yielded an accuracy of 96.8%, a precision of 97.1%, and a recall of 99.0%. Such metrics underscore the model&#x2019;s capacity to maintain exceptional diagnostic accuracy even in large-scale, complex datasets. The minimal number of false negatives highlights the model&#x2019;s strength in reliably identifying diabetic patients, thereby reducing the risk of undetected cases. Likewise, the low false positive rate indicates excellent control over misclassification, reinforcing its clinical relevance.</p>
<p>Further analysis reveals that the very low number of false negatives signifies the model&#x2019;s superior ability to correctly identify diabetic patients, effectively minimizing the risk of missed diagnoses. Simultaneously, the low false positive count reflects the model&#x2019;s capability to control misdiagnosis. Overall, the results from Dataset 3 confirm that the proposed model delivers superior classification performance in large-scale clinical data environments, making it a highly efficient tool for assisting in diabetes diagnosis.</p>
<p>Across all three datasets, a clear trend emerged: as dataset size and feature complexity increased, the model&#x2019;s classification performance improved significantly. This trend underscores the model&#x2019;s strong learning capacity and generalization ability. Dataset 1 demonstrated the model&#x2019;s ability to maintain balanced classification on smaller-scale data; Dataset 2 highlighted the model&#x2019;s precision and robustness on medium-scale data; and Dataset 3 showcased its exceptional performance in handling large and complex datasets, with minimal risks of misdiagnosis or missed diagnosis&#x2014;achieving near-optimal results for medical diagnostic tasks.</p>
<p>Moreover, the proposed model holds significant practical relevance in clinical settings, particularly for early-stage diabetes diagnosis and risk assessment. High accuracy contributes to improved diagnostic efficiency, while high precision and recall assist physicians in accurately identifying high-risk individuals and minimizing diagnostic errors. In conclusion, through comprehensive confusion matrix analysis, the proposed model not only demonstrated robust classification performance but also exhibited excellent adaptability in real-world medical applications, providing an effective and reliable tool for clinical diabetes diagnosis and prediction.</p>
</sec>
<sec id="S4.SS3">
<title>4.3 Statistical analysis</title>
<p>For each dataset, the best Classical ML model is compared with the CNN-Voting Ensemble, and the <italic>p</italic>-value for the paired <italic>t</italic>-test is provided (the significance is determined based on the magnitude of the difference between the two; a significant difference is indicated by &#x003C; 0.01, and a small difference by &#x003C;0.05).</p>
<p>In the Dataset1 (<xref ref-type="table" rid="T5">Table 5</xref>), the CNN&#x2013;Voting Ensemble achieved consistently higher scores than the best Classical ML models (LightGBM for Accuracy, F1 Score, and Recall; CatBoost for AUC). The improvements were highly significant across all metrics: Accuracy (0.78 vs. 0.73, <italic>p</italic> &#x003C; 0.01), AUC (0.85 vs. 0.79, <italic>p</italic> &#x003C; 0.05), F1 Score (0.75 vs. 0.66, <italic>p</italic> &#x003C; 0.01), and Recall (0.72 vs. 0.64, <italic>p</italic> &#x003C; 0.01). These results indicate that the ensemble method provided a statistically robust improvement on Dataset 1.</p>
<table-wrap position="float" id="T5">
<label>TABLE 5</label>
<caption><p>Performance results of Dataset 1.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="left">Metric</td>
<td valign="top" align="left">Best classical ML (model)</td>
<td valign="top" align="left">CNN-voting ensemble</td>
<td valign="top" align="left"><italic>P</italic>-value</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Accuracy</td>
<td valign="top" align="left">0.73 (LightGBM)</td>
<td valign="top" align="left">0.78</td>
<td valign="top" align="left">&#x003C;0.01</td>
</tr>
<tr>
<td valign="top" align="left">AUC</td>
<td valign="top" align="left">0.79 (CatBoost)</td>
<td valign="top" align="left">0.85</td>
<td valign="top" align="left">&#x003C;0.05</td>
</tr>
<tr>
<td valign="top" align="left">F1 score</td>
<td valign="top" align="left">0.66 (LightGBM)</td>
<td valign="top" align="left">0.75</td>
<td valign="top" align="left">&#x003C;0.01</td>
</tr>
<tr>
<td valign="top" align="left">Recall</td>
<td valign="top" align="left">0.64 (LightGBM)</td>
<td valign="top" align="left">0.72</td>
<td valign="top" align="left">&#x003C;0.01</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn><p>With <italic>p</italic>-values vs. best classical ML.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>A similar trend was observed in Dataset 2 (<xref ref-type="table" rid="T6">Table 6</xref>), where the CNN&#x2013;Voting Ensemble significantly outperformed the best Classical ML models (CatBoost for Accuracy, AUC, and F1 Score; LightGBM for Recall). Specifically, Accuracy increased from 0.78 to 0.85 (<italic>p</italic> &#x003C; 0.01), AUC from 0.81 to 0.93 (<italic>p</italic> &#x003C; 0.01), F1 Score from 0.58 to 0.82 (<italic>p</italic> &#x003C; 0.01), and Recall from 0.56 to 0.81 (<italic>p</italic> &#x003C; 0.01). The magnitude of the differences highlights the superiority of the CNN&#x2013;Voting Ensemble, particularly in F1 Score and Recall, which exhibited the largest relative gains.</p>
<table-wrap position="float" id="T6">
<label>TABLE 6</label>
<caption><p>Performance results of Dataset 2.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="left">Metric</td>
<td valign="top" align="left">Best classical ML (model)</td>
<td valign="top" align="left">CNN-voting ensemble</td>
<td valign="top" align="left"><italic>P</italic>-value</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Accuracy</td>
<td valign="top" align="left">0.78 (CatBoost)</td>
<td valign="top" align="left">0.85</td>
<td valign="top" align="left">&#x003C;0.01</td>
</tr>
<tr>
<td valign="top" align="left">AUC</td>
<td valign="top" align="left">0.81 (CatBoost)</td>
<td valign="top" align="left">0.93</td>
<td valign="top" align="left">&#x003C;0.01</td>
</tr>
<tr>
<td valign="top" align="left">F1 score</td>
<td valign="top" align="left">0.58 (CatBoost)</td>
<td valign="top" align="left">0.82</td>
<td valign="top" align="left">&#x003C;0.01</td>
</tr>
<tr>
<td valign="top" align="left">Recall</td>
<td valign="top" align="left">0.56 (LightGBM)</td>
<td valign="top" align="left">0.81</td>
<td valign="top" align="left">&#x003C;0.01</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn><p>With <italic>p</italic>-values vs. best classical ML.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>On Dataset 3 (<xref ref-type="table" rid="T7">Table 7</xref>), the Classical ML models already achieved very strong performance, with Accuracy and AUC exceeding 0.95. Nonetheless, the CNN&#x2013;Voting Ensemble still yielded modest but statistically significant improvements in most metrics: Accuracy (0.98 vs. 0.96, <italic>p</italic> &#x003C; 0.05), F1 Score (0.98 vs. 0.94, <italic>p</italic> &#x003C; 0.05), and Recall (0.99 vs. 0.94, <italic>p</italic> &#x003C; 0.05). For AUC, the difference between the CNN&#x2013;Voting Ensemble and Random Forest was negligible (0.98 vs. 0.98, <italic>p</italic> = 0.05), indicating comparable performance on this dataset.</p>
<table-wrap position="float" id="T7">
<label>TABLE 7</label>
<caption><p>Performance results of Dataset 3.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="left">Metric</td>
<td valign="top" align="left">Best classical ML (model)</td>
<td valign="top" align="left">CNN-voting ensemble</td>
<td valign="top" align="left"><italic>P</italic>-value</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Accuracy</td>
<td valign="top" align="left">0.96 (LightGBM)</td>
<td valign="top" align="left">0.98</td>
<td valign="top" align="left">&#x003C;0.05</td>
</tr>
<tr>
<td valign="top" align="left">AUC</td>
<td valign="top" align="left">0.98(RandomForest)</td>
<td valign="top" align="left">0.98</td>
<td valign="top" align="left">0.05</td>
</tr>
<tr>
<td valign="top" align="left">F1 score</td>
<td valign="top" align="left">0.94 (LightGBM)</td>
<td valign="top" align="left">0.98</td>
<td valign="top" align="left">&#x003C;0.05</td>
</tr>
<tr>
<td valign="top" align="left">Recall</td>
<td valign="top" align="left">0.94(Voting Ensemble)</td>
<td valign="top" align="left">0.99</td>
<td valign="top" align="left">&#x003C;0.05</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn><p>With <italic>p</italic>-values vs. best classical ML.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>The statistical tests confirm that the CNN&#x2013;Voting Ensemble consistently outperformed the strongest baseline Classical ML models across all datasets. The improvements were particularly pronounced in Dataset 1 and Dataset 2, where performance gains were not only numerically larger but also statistically highly significant (<italic>p</italic> &#x003C; 0.01). In Dataset 3, where baseline models were already near ceiling performance, the ensemble achieved smaller yet significant gains. These results provide strong statistical evidence for the superiority of the proposed CNN&#x2013;Voting Ensemble.</p>
</sec>
<sec id="S4.SS4">
<title>4.4 Model interpretability</title>
<p>To evaluate the contribution of individual features to the diabetes prediction task and better understand their roles in classification, we conducted feature importance analysis. By calculating the weight of each feature within the machine learning models, we were able to identify the most influential variables and assess their impact on the model&#x2019;s predictive outcomes. Specifically, this study computed feature importance scores and analyzed their behavior across different datasets.</p>
<p>Dataset 2 included several key physiological indicators reflecting an individual&#x2019;s health status. Feature importance was assessed, and the contribution of each feature to diabetes prediction was quantified. According to the results in <xref ref-type="table" rid="T8">Table 8</xref> and <xref ref-type="fig" rid="F4">Figure 4</xref>, glucose (importance score: 0.2500) ranked first, with the highest feature weight. This finding aligns with the physiological foundation of diabetes prediction&#x2014;glucose level is one of the most critical biomarkers for diabetes. Elevated blood glucose is a hallmark of the condition, making glucose an indispensable contributor to predictive models.</p>
<table-wrap position="float" id="T8">
<label>TABLE 8</label>
<caption><p>Dataset 2 feature importance weights.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="center">No.</td>
<td valign="top" align="center">Feature</td>
<td valign="top" align="center">Importance weights</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">1</td>
<td valign="top" align="center">Glucose</td>
<td valign="top" align="center">0.2500</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">BMI</td>
<td valign="top" align="center">0.1741</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">Age</td>
<td valign="top" align="center">0.147</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">Diabetes pedigree function</td>
<td valign="top" align="center">0.1301</td>
</tr>
<tr>
<td valign="top" align="center">5</td>
<td valign="top" align="center">Blood pressure</td>
<td valign="top" align="center">0.0854</td>
</tr>
<tr>
<td valign="top" align="center">6</td>
<td valign="top" align="center">Insulin</td>
<td valign="top" align="center">0.0739</td>
</tr>
<tr>
<td valign="top" align="center">7</td>
<td valign="top" align="center">Pregnancies</td>
<td valign="top" align="center">0.0714</td>
</tr>
<tr>
<td valign="top" align="center">8</td>
<td valign="top" align="center">Skin thickness</td>
<td valign="top" align="center">0.0672</td>
</tr>
</tbody>
</table></table-wrap>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>Histogram of feature weights for Dataset 2.</p></caption>
<alt-text>Bar chart showing feature importance weights for predicting an outcome. Glucose has the highest importance, followed by BMI, age, diabetes pedigree function, blood pressure, insulin, pregnancies, and skin thickness. Weights range from 0.00 to 0.25.</alt-text>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-12-1657889-g004.tif"/>
</fig>
<p>Following glucose, Body Mass Index (BMI) (0.1741) and age (0.147) ranked second and third, respectively. BMI is a key indicator of obesity, which is a major risk factor for diabetes. High BMI is strongly associated with insulin resistance and metabolic syndrome, thus playing an essential role in diabetes risk stratification (<xref ref-type="bibr" rid="B45">45</xref>). Age is also a well-established risk factor for diabetes, with incidence increasing significantly after the age of 45 (<xref ref-type="bibr" rid="B46">46</xref>). Accordingly, age received a high importance score in the model.</p>
<p>Other features in Dataset 2, such as Diabetes Pedigree Function and blood pressure, also demonstrated strong predictive value. The pedigree function reflects genetic predisposition, a known factor in diabetes development. Blood pressure is closely linked to diabetes complications&#x2014;hypertension often coexists with diabetes and increases the risk of cardiovascular and renal diseases (<xref ref-type="bibr" rid="B47">47</xref>).</p>
<p>Dataset 3 incorporated a broader range of laboratory test results, increasing feature complexity. As presented in <xref ref-type="table" rid="T9">Table 9</xref> and <xref ref-type="fig" rid="F5">Figure 5</xref>, urea (0.1378) emerged as the most important predictor. Urea is a nitrogenous metabolite in the blood, and its concentration level can be a sensitive reflection of the metabolic and excretory function of the kidneys. In several studies, including a comparative study by Kumar et al. (<xref ref-type="bibr" rid="B48">48</xref>), it was found that serum urea levels were significantly higher in diabetic patients than in nondiabetic populations, especially in those with a longer duration of disease or poor glycaemic control, and that this elevation was strongly correlated with glycated hemoglobin (HbA1c) levels as well as with the duration of the diabetes (<xref ref-type="bibr" rid="B48">48</xref>). This finding suggests that blood urea is not only an early marker for the development of diabetic nephropathy (DN), but also serves as an important bioindicator of the level of diabetes control and risk of complications. Age (0.0838) and triglycerides (0.0555) ranked second and third, respectively. Age remains a strong predictor due to declining insulin sensitivity over time. Triglycerides are an important component of lipid metabolism in humans, and they also play a key role in the development and progression of diabetes. In recent studies, elevated plasma triglyceride levels have been highly correlated with insulin resistance. Under normal physiological conditions, insulin inhibits lipolysis in adipose tissue and reduces the release of free fatty acids (FFAs) (<xref ref-type="bibr" rid="B49">49</xref>). However, in insulin resistance, this inhibitory mechanism is impaired, leading to a significant increase in blood FFAs, which further stimulates hepatic synthesis of triglycerides and creates a vicious circle. In addition, abnormally elevated triglycerides can directly exacerbate decreased insulin sensitivity by interfering with insulin signaling pathways (<xref ref-type="bibr" rid="B50">50</xref>). This lipotoxic effect is not only a precursor state for the development of type 2 diabetes, but also a risk factor for its chronic complications (e.g., cardiovascular disease, fatty liver, diabetic nephropathy, etc.). In this study, triglycerides were included as a high-impact variable in the mixed model and ranked high in the feature importance analysis, further validating its biological importance in diabetes prediction. Elevated triglyceride levels are often an early indicator of diabetes, making them a valuable feature in predictive modeling.</p>
<table-wrap position="float" id="T9">
<label>TABLE 9</label>
<caption><p>Dataset 3 feature importance weights.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="center">No.</td>
<td valign="top" align="center">Feature</td>
<td valign="top" align="center">Importance weights</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">1</td>
<td valign="top" align="center">Urea</td>
<td valign="top" align="center">0.1378</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">Age</td>
<td valign="top" align="center">0.0838</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">Triglycerides</td>
<td valign="top" align="center">0.0555</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">Mean corpuscular volume</td>
<td valign="top" align="center">0.0538</td>
</tr>
<tr>
<td valign="top" align="center">5</td>
<td valign="top" align="center">Neutrophil percentage</td>
<td valign="top" align="center">0.0427</td>
</tr>
<tr>
<td valign="top" align="center">6</td>
<td valign="top" align="center">Red blood cell count</td>
<td valign="top" align="center">0.0421</td>
</tr>
<tr>
<td valign="top" align="center">7</td>
<td valign="top" align="center">Alkaline phosphatase</td>
<td valign="top" align="center">0.0385</td>
</tr>
<tr>
<td valign="top" align="center">8</td>
<td valign="top" align="center">Aspartate aminotransferase</td>
<td valign="top" align="center">0.0380</td>
</tr>
<tr>
<td valign="top" align="center">9</td>
<td valign="top" align="center">Platelet distribution width</td>
<td valign="top" align="center">0.0374</td>
</tr>
<tr>
<td valign="top" align="center">10</td>
<td valign="top" align="center">Mean corpuscular hemoglobin concentration</td>
<td valign="top" align="center">0.0362</td>
</tr>
<tr>
<td valign="top" align="center">11</td>
<td valign="top" align="center">Red cell distribution width</td>
<td valign="top" align="center">0.0317</td>
</tr>
<tr>
<td valign="top" align="center">12</td>
<td valign="top" align="center">Uric acid</td>
<td valign="top" align="center">0.0309</td>
</tr>
<tr>
<td valign="top" align="center">13</td>
<td valign="top" align="center">Albumin</td>
<td valign="top" align="center">0.0293</td>
</tr>
<tr>
<td valign="top" align="center">14</td>
<td valign="top" align="center">Lymphocyte percentage</td>
<td valign="top" align="center">0.0285</td>
</tr>
<tr>
<td valign="top" align="center">15</td>
<td valign="top" align="center">Hemoglobin</td>
<td valign="top" align="center">0.0254</td>
</tr>
<tr>
<td valign="top" align="center">16</td>
<td valign="top" align="center">Globulin</td>
<td valign="top" align="center">0.0252</td>
</tr>
<tr>
<td valign="top" align="center">17</td>
<td valign="top" align="center">r-Glutamyl transferase</td>
<td valign="top" align="center">0.0232</td>
</tr>
<tr>
<td valign="top" align="center">18</td>
<td valign="top" align="center">Hematocrit</td>
<td valign="top" align="center">0.0229</td>
</tr>
<tr>
<td valign="top" align="center">19</td>
<td valign="top" align="center">Monocyte percentage</td>
<td valign="top" align="center">0.0224</td>
</tr>
<tr>
<td valign="top" align="center">20</td>
<td valign="top" align="center">Eosinophil percentage</td>
<td valign="top" align="center">0.0207</td>
</tr>
<tr>
<td valign="top" align="center">21</td>
<td valign="top" align="center">Creatinine</td>
<td valign="top" align="center">0.0200</td>
</tr>
<tr>
<td valign="top" align="center">22</td>
<td valign="top" align="center">Low-density lipoprotein cholesterol</td>
<td valign="top" align="center">0.0180</td>
</tr>
<tr>
<td valign="top" align="center">23</td>
<td valign="top" align="center">White blood cell count</td>
<td valign="top" align="center">0.0174</td>
</tr>
<tr>
<td valign="top" align="center">24</td>
<td valign="top" align="center">Total cholesterol</td>
<td valign="top" align="center">0.0167</td>
</tr>
<tr>
<td valign="top" align="center">25</td>
<td valign="top" align="center">High-density lipoprotein cholesterol</td>
<td valign="top" align="center">0.0160</td>
</tr>
<tr>
<td valign="top" align="center">26</td>
<td valign="top" align="center">Basophil percentage</td>
<td valign="top" align="center">0.0159</td>
</tr>
<tr>
<td valign="top" align="center">27</td>
<td valign="top" align="center">Alanine aminotransferase</td>
<td valign="top" align="center">0.0159</td>
</tr>
<tr>
<td valign="top" align="center">28</td>
<td valign="top" align="center">Plateletcrit</td>
<td valign="top" align="center">0.0153</td>
</tr>
<tr>
<td valign="top" align="center">29</td>
<td valign="top" align="center">Mean platelet volume</td>
<td valign="top" align="center">0.0113</td>
</tr>
<tr>
<td valign="top" align="center">30</td>
<td valign="top" align="center">Platelet count</td>
<td valign="top" align="center">0.0110</td>
</tr>
<tr>
<td valign="top" align="center">31</td>
<td valign="top" align="center">Albumin/globulin ratio</td>
<td valign="top" align="center">0.0096</td>
</tr>
<tr>
<td valign="top" align="center">32</td>
<td valign="top" align="center">Male</td>
<td valign="top" align="center">0.0031</td>
</tr>
<tr>
<td valign="top" align="center">33</td>
<td valign="top" align="center">Mean corpuscular hemoglobin</td>
<td valign="top" align="center">0.0019</td>
</tr>
<tr>
<td valign="top" align="center">34</td>
<td valign="top" align="center">Total protein</td>
<td valign="top" align="center">0.0018</td>
</tr>
<tr>
<td valign="top" align="center">35</td>
<td valign="top" align="center">Female</td>
<td valign="top" align="center">0.0001</td>
</tr>
</tbody>
</table></table-wrap>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>Histogram of feature weights for Dataset 3.</p></caption>
<alt-text>Horizontal bar chart showing feature importance weight. Urea is the most important feature with a weight of approximately 0.14, followed by age, triglycerides, mean corpuscular volume, neutrophil percentage, red blood cell count, alkaline phosphatase, aspartate aminotransferase, platelet distribution width, and mean corpuscular hemoglobin concentration.</alt-text>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-12-1657889-g005.tif"/>
</fig>
<p>Additionally, features such as Mean Corpuscular Volume (MCV) (0.0538) and neutrophil percentage (0.0427) demonstrated notable predictive capacity. MCV reflects red blood cell size, and abnormalities may be associated with chronic conditions, including diabetes. Neutrophil percentage is an immune system marker indicating inflammation, which plays a role in diabetes pathogenesis and complications (<xref ref-type="bibr" rid="B51">51</xref>). Recent literature has mentioned that neutrophils can also cause type 1 and type 2 diabetes by promoting chronic inflammation, tissue damage, and immune dysfunction. In type 1 diabetes, neutrophils interact with other immune cells, leading to the destruction of beta cells and the release of pro-inflammatory mediators (<xref ref-type="bibr" rid="B52">52</xref>). In type 2 diabetes, persistent hyperglycaemia increases the recruitment and activation of neutrophils, leading to kidney and vascular damage (<xref ref-type="bibr" rid="B53">53</xref>, <xref ref-type="bibr" rid="B54">54</xref>). Other features from Dataset 3&#x2014;such as red blood cell count and platelet distribution width&#x2014;also ranked relatively high. Platelet-related metrics can reflect coagulation status and vascular health, which are closely related to diabetes complications such as cardiovascular disease and vascular damage.</p>
<p>Overall, glucose consistently exhibited the strongest predictive power across all datasets, which aligns with the physiological mechanisms underlying diabetes. BMI and age also held high importance scores throughout, confirming the central roles of obesity and age in diabetes pathogenesis. Notably, urea stood out in Dataset 3 due to its association with renal function, a critical concern in diabetic complications. Features such as triglycerides, MCV, and neutrophil percentage captured aspects of metabolic status and immune response, further enhancing model performance in complex diagnostic contexts.</p>
<p>Some lower-weighted features in Dataset 3, such as platelet count and white blood cell count, also provided supplementary information for model decision-making. As recent studies have shown, compared with non-diabetic control groups, diabetic patients (including type 1 and type 2) often have higher platelet counts and platelet indices (e.g., mean platelet volume (MPV), platelet distribution width (PDW), platelet-large cell ratio (P-LCR), and plateletcrit (PCT)) (<xref ref-type="bibr" rid="B55">55</xref>&#x2013;<xref ref-type="bibr" rid="B57">57</xref>). In individuals with gestational diabetes mellitus (GDM) and type 2 diabetes mellitus (T2DM), persistently elevated white blood cell counts indicate a link between systemic inflammation and the onset of diabetes (<xref ref-type="bibr" rid="B58">58</xref>, <xref ref-type="bibr" rid="B59">59</xref>). While their overall importance was lower, they may still contribute to individual predictions, especially in early screening for complications. Variations in these immune and hematological indicators may offer important early clues in diabetes diagnosis.</p>
<p>Through feature importance analysis, we identified the key predictors for diabetes classification. Physiological features such as glucose, BMI, and age consistently provided high predictive value across datasets, confirming their utility in screening and risk assessment. In addition, Dataset 3 features like urea, triglycerides, and MCV further enhanced the model&#x2019;s capability, especially in predicting diabetes-related complications, thus carrying substantial clinical relevance. These findings provide important interpretability support for the proposed prediction model, helping us understand which features dominate decision-making. By integrating physiological knowledge with feature importance analysis, future diabetes prediction systems can offer more precise early screening and personalized risk evaluation.</p>
</sec>
</sec>
<sec id="S5" sec-type="conclusion">
<title>5 Conclusion</title>
<p>This study proposes an innovative hybrid model that combines convolutional neural networks (CNNs) with ensemble learning methods, significantly improving the accuracy and robustness of diabetes prediction. By combining the deep feature extraction capabilities of CNNs with the advantages of traditional machine learning algorithms, this model performs exceptionally well on three datasets, particularly in handling high-dimensional data and class imbalance issues, demonstrating its strong adaptability and versatility.</p>
<p>Experimental results show that the CNN-Voting Ensemble model outperforms traditional models and standalone ensemble methods across multiple key performance metrics, particularly in terms of accuracy (up to 98%), AUC (0.99), F1 score (0.98), and recall (99%), and achieves the highest MCC across all three datasets (0.56, 0.66, 0.94), reflecting the innovative model&#x2019;s exceptional predictive capability and efficient diagnostic performance. This indicates that the hybrid model not only improves the performance of diabetes prediction but also provides reliable and interpretable decision support for early diagnosis and risk assessment in real clinical settings.</p>
<p>Additionally, feature importance analysis further validates the critical role of clinically relevant biomarkers (such as blood glucose, BMI, age, and urea) in diabetes prediction, enhancing the model&#x2019;s clinical interpretability. The model&#x2019;s high accuracy, stability, and robustness make it a tool with significant clinical application value in diabetes management, particularly when dealing with varying data scales and complexities.</p>
<p>In summary, the hybrid model proposed in this study provides a robust solution for diabetes prediction tasks, significantly outperforming existing methods in terms of accuracy and robustness. Its scalability and interpretability also confer broad clinical application potential, offering new insights for early screening and personalized risk assessment in diabetes management.</p>
</sec>
</body>
<back>
<sec id="S6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: <ext-link ext-link-type="uri" xlink:href="https://archive.ics.uci.edu/">https://archive.ics.uci.edu/</ext-link>, <ext-link ext-link-type="uri" xlink:href="https://tianchi.aliyun.com/competition/entrance/231638/information">https://tianchi.aliyun.com/competition/entrance/231638/information</ext-link>.</p>
</sec>
<sec id="S7" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>Ethical approval was not required for the study involving humans in accordance with the local legislation and institutional requirements. Written informed consent to participate in this study was not required from the participants or the participants&#x2019; legal guardians/next of kin in accordance with the national legislation and the institutional requirements.</p>
</sec>
<sec id="S8" sec-type="author-contributions">
<title>Author contributions</title>
<p>KZ: Conceptualization, Data curation, Software, Writing &#x2013; original draft, Visualization, Writing &#x2013; review &#x0026; editing. CZ: Formal analysis, Investigation, Writing &#x2013; original draft. ZC: Methodology, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. TS: Resources, Validation, Writing &#x2013; review &#x0026; editing. MW: Supervision, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec id="S9" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research, and/or publication of this article.</p>
</sec>
<sec id="S10" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="S11" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The authors declare that no Generative AI was used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec id="S12" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="S13" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmed.2025.1657889/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmed.2025.1657889/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.pdf" id="DS1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><label>1.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Khan</surname> <given-names>R</given-names></name> <name><surname>Chua</surname> <given-names>Z</given-names></name> <name><surname>Tan</surname> <given-names>J</given-names></name> <name><surname>Yang</surname> <given-names>Y</given-names></name> <name><surname>Liao</surname> <given-names>Z</given-names></name> <name><surname>Zhao</surname> <given-names>Y</given-names></name></person-group>. <article-title>From pre-diabetes to diabetes: diagnosis, treatments and translational research.</article-title> <source><italic>Medicina.</italic></source> (<year>2019</year>) <volume>55</volume>:<fpage>546</fpage>. <pub-id pub-id-type="doi">10.3390/medicina55090546</pub-id> <pub-id pub-id-type="pmid">31470636</pub-id></citation></ref>
<ref id="B2"><label>2.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Arvind</surname> <given-names>K</given-names></name> <name><surname>Gangwar</surname> <given-names>R</given-names></name> <name><surname>Zargar</surname> <given-names>A</given-names></name> <name><surname>Kumar</surname> <given-names>R</given-names></name> <name><surname>Sharma</surname> <given-names>A</given-names></name></person-group>. <article-title>Prevalence of diabetes in India: a review of IDF diabetes atlas 10th edition.</article-title> <source><italic>Curr Diabetes Rev.</italic></source> (<year>2024</year>) <volume>20</volume>:<fpage>e130423215752</fpage>. <pub-id pub-id-type="doi">10.2174/1573399819666230413094200</pub-id> <pub-id pub-id-type="pmid">37069712</pub-id></citation></ref>
<ref id="B3"><label>3.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Demir</surname> <given-names>S</given-names></name> <name><surname>Nawroth</surname> <given-names>P</given-names></name> <name><surname>Herzig</surname> <given-names>S</given-names></name> <name><surname>Ekim &#x00DC;st&#x00FC;nel</surname> <given-names>B</given-names></name></person-group>. <article-title>Emerging targets in type 2 diabetes and diabetic complications.</article-title> <source><italic>Adv Sci.</italic></source> (<year>2021</year>) <volume>8</volume>:<fpage>e2100275</fpage>. <pub-id pub-id-type="doi">10.1002/advs.202100275</pub-id> <pub-id pub-id-type="pmid">34319011</pub-id></citation></ref>
<ref id="B4"><label>4.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Eid</surname> <given-names>S</given-names></name> <name><surname>Sas</surname> <given-names>K</given-names></name> <name><surname>Abcouwer</surname> <given-names>S</given-names></name> <name><surname>Feldman</surname> <given-names>E</given-names></name> <name><surname>Gardner</surname> <given-names>T</given-names></name> <name><surname>Pennathur</surname> <given-names>S</given-names></name><etal/></person-group> <article-title>New insights into the mechanisms of diabetic complications: role of lipids and lipid metabolism.</article-title> <source><italic>Diabetologia.</italic></source> (<year>2019</year>) <volume>62</volume>:<fpage>1539</fpage>&#x2013;<lpage>49</lpage>. <pub-id pub-id-type="doi">10.1007/s00125-019-4959-1</pub-id> <pub-id pub-id-type="pmid">31346658</pub-id></citation></ref>
<ref id="B5"><label>5.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Khalil</surname> <given-names>H</given-names></name></person-group>. <article-title>Diabetes microvascular complications&#x2013;a clinical update.</article-title> <source><italic>Diabetes Metab Syndr.</italic></source> (<year>2017</year>) <volume>11</volume>:<fpage>S133</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1016/j.dsx.2016.12.022</pub-id> <pub-id pub-id-type="pmid">27993541</pub-id></citation></ref>
<ref id="B6"><label>6.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lindstr&#x00F6;m</surname> <given-names>J</given-names></name> <name><surname>Louheranta</surname> <given-names>A</given-names></name> <name><surname>Mannelin</surname> <given-names>M</given-names></name> <name><surname>Rastas</surname> <given-names>M</given-names></name> <name><surname>Salminen</surname> <given-names>V</given-names></name> <name><surname>Eriksson</surname> <given-names>J</given-names></name><etal/></person-group> <article-title>The Finnish diabetes prevention study (DPS): lifestyle intervention and 3-year results on diet and physical activity.</article-title> <source><italic>Diabetes Care.</italic></source> (<year>2003</year>) <volume>26</volume>:<fpage>3230</fpage>&#x2013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.2337/diacare.26.12.3230</pub-id> <pub-id pub-id-type="pmid">14633807</pub-id></citation></ref>
<ref id="B7"><label>7.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Waugh</surname> <given-names>N</given-names></name> <name><surname>Scotland</surname> <given-names>G</given-names></name> <name><surname>McNamee</surname> <given-names>P</given-names></name> <name><surname>Gillett</surname> <given-names>M</given-names></name> <name><surname>Brennan</surname> <given-names>A</given-names></name> <name><surname>Goyder</surname> <given-names>E</given-names></name><etal/></person-group> <article-title>Screening for type 2 diabetes: literature review and economic modelling.</article-title> <source><italic>Health Technol Assess.</italic></source> (<year>2007</year>) <volume>11</volume>:<fpage>iii</fpage>&#x2013;<lpage>iv, ix&#x2013;xi, 1&#x2013;125</lpage>. <pub-id pub-id-type="doi">10.3310/hta11170</pub-id> <pub-id pub-id-type="pmid">17462167</pub-id></citation></ref>
<ref id="B8"><label>8.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kaur</surname> <given-names>G</given-names></name> <name><surname>Lakshmi</surname> <given-names>P</given-names></name> <name><surname>Rastogi</surname> <given-names>A</given-names></name> <name><surname>Bhansali</surname> <given-names>A</given-names></name> <name><surname>Jain</surname> <given-names>S</given-names></name> <name><surname>Teerawattananon</surname> <given-names>Y</given-names></name><etal/></person-group> <article-title>Diagnostic accuracy of tests for type 2 diabetes and prediabetes: a systematic review and meta-analysis.</article-title> <source><italic>PLoS One.</italic></source> (<year>2020</year>) <volume>15</volume>:<fpage>e0242415</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0242415</pub-id> <pub-id pub-id-type="pmid">33216783</pub-id></citation></ref>
<ref id="B9"><label>9.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Deberneh</surname> <given-names>H</given-names></name> <name><surname>Kim</surname> <given-names>I</given-names></name></person-group>. <article-title>Prediction of type 2 diabetes based on machine learning algorithm.</article-title> <source><italic>Int J Environ Res Public Health.</italic></source> (<year>2021</year>) <volume>18</volume>:<fpage>3317</fpage>. <pub-id pub-id-type="doi">10.3390/ijerph18063317</pub-id> <pub-id pub-id-type="pmid">33806973</pub-id></citation></ref>
<ref id="B10"><label>10.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Olisah</surname> <given-names>C</given-names></name> <name><surname>Smith</surname> <given-names>L</given-names></name> <name><surname>Smith</surname> <given-names>M</given-names></name></person-group>. <article-title>Diabetes mellitus prediction and diagnosis from a data preprocessing and machine learning perspective.</article-title> <source><italic>Comput Methods Programs Biomed.</italic></source> (<year>2022</year>) <volume>220</volume>:<fpage>106773</fpage>. <pub-id pub-id-type="doi">10.1016/j.cmpb.2022.106773</pub-id> <pub-id pub-id-type="pmid">35429810</pub-id></citation></ref>
<ref id="B11"><label>11.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lopez-Arevalo</surname> <given-names>I</given-names></name> <name><surname>Aldana-Bobadilla</surname> <given-names>E</given-names></name> <name><surname>Molina-Villegas</surname> <given-names>A</given-names></name> <name><surname>Galeana-Zapi&#x00E9;n</surname> <given-names>H</given-names></name> <name><surname>Mu&#x00F1;iz-Sanchez</surname> <given-names>V</given-names></name> <name><surname>Gausin-Valle</surname> <given-names>S</given-names></name></person-group>. <article-title>A memory-efficient encoding method for processing mixed-type data on machine learning.</article-title> <source><italic>Entropy.</italic></source> (<year>2020</year>) <volume>22</volume>:<fpage>1391</fpage>. <pub-id pub-id-type="doi">10.3390/e22121391</pub-id> <pub-id pub-id-type="pmid">33316972</pub-id></citation></ref>
<ref id="B12"><label>12.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dahouda</surname> <given-names>MK</given-names></name> <name><surname>Joe</surname> <given-names>I</given-names></name></person-group>. <article-title>A deep-learned embedding technique for categorical features encoding.</article-title> <source><italic>IEEE Access.</italic></source> (<year>2021</year>) <volume>9</volume>:<fpage>114381</fpage>&#x2013;<lpage>91</lpage>. <pub-id pub-id-type="doi">10.1109/ACCESS.2021.3104357</pub-id></citation></ref>
<ref id="B13"><label>13.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dinh</surname> <given-names>A</given-names></name> <name><surname>Miertschin</surname> <given-names>S</given-names></name> <name><surname>Young</surname> <given-names>A</given-names></name> <name><surname>Mohanty</surname> <given-names>SD</given-names></name></person-group>. <article-title>A data-driven approach to predicting diabetes and cardiovascular disease with machine learning.</article-title> <source><italic>BMC Med Inform Decis Mak.</italic></source> (<year>2019</year>) <volume>19</volume>:<fpage>211</fpage>. <pub-id pub-id-type="doi">10.1186/s12911-019-0918-5</pub-id> <pub-id pub-id-type="pmid">31694707</pub-id></citation></ref>
<ref id="B14"><label>14.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Starovoitov</surname> <given-names>V</given-names></name> <name><surname>Golub</surname> <given-names>Y</given-names></name></person-group>. <article-title>Data normalization in machine learning.</article-title> <source><italic>Informatics.</italic></source> (<year>2021</year>) <volume>18</volume>:<fpage>83</fpage>&#x2013;<lpage>96</lpage>. <pub-id pub-id-type="doi">10.37661/1816-0301-2021-18-3-83-96</pub-id></citation></ref>
<ref id="B15"><label>15.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Singh</surname> <given-names>D</given-names></name> <name><surname>Singh</surname> <given-names>B</given-names></name></person-group>. <article-title>Investigating the impact of data normalization on classification performance.</article-title> <source><italic>Appl Soft Comput.</italic></source> (<year>2020</year>) <volume>97</volume>:<fpage>105524</fpage>. <pub-id pub-id-type="doi">10.1016/J.ASOC.2019.105524</pub-id></citation></ref>
<ref id="B16"><label>16.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fern&#x00E1;ndez</surname> <given-names>A</given-names></name> <name><surname>Garcia</surname> <given-names>S</given-names></name> <name><surname>Herrera</surname> <given-names>F</given-names></name> <name><surname>Chawla</surname> <given-names>NV</given-names></name></person-group>. <article-title>SMOTE for learning from imbalanced data: progress and challenges, marking the 15-year anniversary.</article-title> <source><italic>J Artif Intell Res.</italic></source> (<year>2018</year>) <volume>61</volume>:<fpage>863</fpage>&#x2013;<lpage>905</lpage>. <pub-id pub-id-type="doi">10.1613/jair.1.11192</pub-id></citation></ref>
<ref id="B17"><label>17.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shipe</surname> <given-names>M</given-names></name> <name><surname>Deppen</surname> <given-names>S</given-names></name> <name><surname>Farjah</surname> <given-names>F</given-names></name> <name><surname>Grogan</surname> <given-names>E</given-names></name></person-group>. <article-title>Developing prediction models for clinical use using logistic regression: an overview.</article-title> <source><italic>J Thorac Dis.</italic></source> (<year>2019</year>) <volume>11</volume>:<fpage>S574</fpage>&#x2013;<lpage>84</lpage>. <pub-id pub-id-type="doi">10.21037/jtd.2019.01.25</pub-id> <pub-id pub-id-type="pmid">31032076</pub-id></citation></ref>
<ref id="B18"><label>18.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Singamsetty</surname> <given-names>S</given-names></name> <name><surname>Ghanta</surname> <given-names>S</given-names></name> <name><surname>Biswas</surname> <given-names>S</given-names></name> <name><surname>Pradhan</surname> <given-names>A</given-names></name></person-group>. <article-title>Enhancing machine learning-based forecasting of chronic renal disease with explainable AI.</article-title> <source><italic>PeerJ Comput Sci.</italic></source> (<year>2024</year>) <volume>10</volume>:<fpage>e2291</fpage>. <pub-id pub-id-type="doi">10.7717/peerj-cs.2291</pub-id> <pub-id pub-id-type="pmid">39650439</pub-id></citation></ref>
<ref id="B19"><label>19.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>H</given-names></name> <name><surname>Lee</surname> <given-names>E</given-names></name> <name><surname>Ham</surname> <given-names>S</given-names></name> <name><surname>Lee</surname> <given-names>H</given-names></name> <name><surname>Lee</surname> <given-names>J</given-names></name> <name><surname>Kwon</surname> <given-names>S</given-names></name><etal/></person-group> <article-title>Machine learning approach to identify stroke within 4.5 hours.</article-title> <source><italic>Stroke.</italic></source> (<year>2020</year>) <volume>51</volume>:<fpage>860</fpage>&#x2013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1161/STROKEAHA.119.027611</pub-id> <pub-id pub-id-type="pmid">31987014</pub-id></citation></ref>
<ref id="B20"><label>20.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zabor</surname> <given-names>E</given-names></name> <name><surname>Reddy</surname> <given-names>C</given-names></name> <name><surname>Tendulkar</surname> <given-names>R</given-names></name> <name><surname>Patil</surname> <given-names>S</given-names></name></person-group>. <article-title>Logistic regression in clinical studies.</article-title> <source><italic>Int J Radiat Oncol Biol Phys.</italic></source> (<year>2022</year>) <volume>112</volume>:<fpage>271</fpage>&#x2013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijrobp.2021.08.007</pub-id> <pub-id pub-id-type="pmid">34416341</pub-id></citation></ref>
<ref id="B21"><label>21.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ali</surname> <given-names>L</given-names></name> <name><surname>Wajahat</surname> <given-names>I</given-names></name> <name><surname>Amiri Golilarz</surname> <given-names>N</given-names></name></person-group>. <article-title>LDA&#x2013;GA&#x2013;SVM: improved hepatocellular carcinoma prediction through dimensionality reduction and genetically optimized support vector machine.</article-title> <source><italic>Neural Comput Appl.</italic></source> (<year>2020</year>) <volume>33</volume>:<fpage>2783</fpage>&#x2013;<lpage>92</lpage>. <pub-id pub-id-type="doi">10.1007/s00521-020-05157-2</pub-id></citation></ref>
<ref id="B22"><label>22.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ozer</surname> <given-names>M</given-names></name> <name><surname>Sarica</surname> <given-names>P</given-names></name> <name><surname>Arga</surname> <given-names>K</given-names></name></person-group>. <article-title>New machine learning applications to accelerate personalized medicine in breast cancer: rise of the support vector machines.</article-title> <source><italic>OMICS.</italic></source> (<year>2020</year>) <volume>24</volume>:<fpage>241</fpage>&#x2013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1089/omi.2020.0001</pub-id> <pub-id pub-id-type="pmid">32228365</pub-id></citation></ref>
<ref id="B23"><label>23.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Islam</surname> <given-names>MM</given-names></name> <name><surname>Haque</surname> <given-names>MR</given-names></name> <name><surname>Iqbal</surname> <given-names>H</given-names></name> <name><surname>Hasan</surname> <given-names>M</given-names></name> <name><surname>Hasan</surname> <given-names>M</given-names></name> <name><surname>Kabir</surname> <given-names>M</given-names></name></person-group>. <article-title>Breast cancer prediction: a comparative study using machine learning techniques.</article-title> <source><italic>SN Comput Sci.</italic></source> (<year>2020</year>) <volume>1</volume>:<fpage>290</fpage>. <pub-id pub-id-type="doi">10.1007/s42979-020-00305-w</pub-id></citation></ref>
<ref id="B24"><label>24.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>James</surname> <given-names>G</given-names></name> <name><surname>Witten</surname> <given-names>D</given-names></name> <name><surname>Hastie</surname> <given-names>T</given-names></name> <name><surname>Tibshirani</surname> <given-names>R.</given-names></name></person-group> <source><italic>An introduction to statistical learning.</italic></source> (<volume>Vol. 112</volume>). <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name> (<year>2013</year>).</citation></ref>
<ref id="B25"><label>25.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sosa-Hern&#x00E1;ndez</surname> <given-names>V</given-names></name> <name><surname>Monroy</surname> <given-names>R</given-names></name> <name><surname>Medina-P&#x00E9;rez</surname> <given-names>MA</given-names></name> <name><surname>Loyola-Gonz&#x00E1;lez</surname> <given-names>O</given-names></name> <name><surname>Herrera</surname> <given-names>F</given-names></name></person-group>. <article-title>A practical tutorial for decision tree induction.</article-title> <source><italic>ACM Comput Surv.</italic></source> (<year>2021</year>) <volume>54</volume>:<fpage>1</fpage>&#x2013;<lpage>38</lpage>. <pub-id pub-id-type="doi">10.1145/3429739</pub-id></citation></ref>
<ref id="B26"><label>26.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mienye</surname> <given-names>ID</given-names></name> <name><surname>Jere</surname> <given-names>N</given-names></name></person-group>. <article-title>A survey of decision trees: concepts, algorithms, and applications.</article-title> <source><italic>IEEE Access.</italic></source> (<year>2024</year>) <volume>12</volume>:<fpage>86716</fpage>&#x2013;<lpage>27</lpage>. <pub-id pub-id-type="doi">10.1109/ACCESS.2024.3416838</pub-id></citation></ref>
<ref id="B27"><label>27.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Alghowinem</surname> <given-names>S</given-names></name> <name><surname>Gedeon</surname> <given-names>T</given-names></name> <name><surname>Goecke</surname> <given-names>R</given-names></name> <name><surname>Cohn</surname> <given-names>J</given-names></name> <name><surname>Parker</surname> <given-names>G</given-names></name></person-group>. <article-title>Interpretation of depression detection models via feature selection methods.</article-title> <source><italic>IEEE Trans Affect Comput.</italic></source> (<year>2023</year>) <volume>14</volume>:<fpage>133</fpage>&#x2013;<lpage>52</lpage>. <pub-id pub-id-type="doi">10.1109/taffc.2020.3035535</pub-id> <pub-id pub-id-type="pmid">36938342</pub-id></citation></ref>
<ref id="B28"><label>28.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Roe</surname> <given-names>K</given-names></name> <name><surname>Jawa</surname> <given-names>V</given-names></name> <name><surname>Zhang</surname> <given-names>X</given-names></name> <name><surname>Chute</surname> <given-names>C</given-names></name> <name><surname>Epstein</surname> <given-names>J</given-names></name> <name><surname>Matelsky</surname> <given-names>J</given-names></name><etal/></person-group> <article-title>Feature engineering with clinical expert knowledge: a case study assessment of machine learning model complexity and performance.</article-title> <source><italic>PLoS One.</italic></source> (<year>2020</year>) <volume>15</volume>:<fpage>e0231300</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0231300</pub-id> <pub-id pub-id-type="pmid">32324754</pub-id></citation></ref>
<ref id="B29"><label>29.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Figueroa Barraza</surname> <given-names>J</given-names></name> <name><surname>L&#x00F3;pez Droguett</surname> <given-names>E</given-names></name> <name><surname>Martins</surname> <given-names>M</given-names></name></person-group>. <article-title>Towards interpretable deep learning: a feature selection framework for prognostics and health management using deep neural networks.</article-title> <source><italic>Sensors.</italic></source> (<year>2021</year>) <volume>21</volume>:<fpage>5888</fpage>. <pub-id pub-id-type="doi">10.3390/s21175888</pub-id> <pub-id pub-id-type="pmid">34502778</pub-id></citation></ref>
<ref id="B30"><label>30.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>K</given-names></name> <name><surname>Wang</surname> <given-names>F</given-names></name> <name><surname>Yang</surname> <given-names>L</given-names></name></person-group>. <article-title>Deep feature screening: feature selection for ultra-high-dimensional data via deep neural networks.</article-title> <source><italic>Neurocomputing.</italic></source> (<year>2022</year>) <volume>538</volume>:<fpage>126186</fpage>. <pub-id pub-id-type="doi">10.1016/j.neucom.2023.03.047</pub-id></citation></ref>
<ref id="B31"><label>31.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kleiman</surname> <given-names>M</given-names></name> <name><surname>Barenholtz</surname> <given-names>E</given-names></name> <name><surname>Galvin</surname> <given-names>J</given-names></name></person-group>. <article-title>Screening for early-stage Alzheimer&#x2019;s disease using optimized feature sets and machine learning.</article-title> <source><italic>J Alzheimers Dis.</italic></source> (<year>2020</year>) <volume>81</volume>:<fpage>355</fpage>&#x2013;<lpage>66</lpage>. <pub-id pub-id-type="doi">10.3233/JAD-201377</pub-id> <pub-id pub-id-type="pmid">33780367</pub-id></citation></ref>
<ref id="B32"><label>32.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chakraborty</surname> <given-names>C</given-names></name> <name><surname>Kishor</surname> <given-names>A</given-names></name> <name><surname>Rodrigues</surname> <given-names>J</given-names></name></person-group>. <article-title>Novel enhanced-grey wolf optimization hybrid machine learning technique for biomedical data computation.</article-title> <source><italic>Comput Electr Eng.</italic></source> (<year>2022</year>) <volume>99</volume>:<fpage>107778</fpage>. <pub-id pub-id-type="doi">10.1016/j.compeleceng.2022.107778</pub-id></citation></ref>
<ref id="B33"><label>33.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mienye</surname> <given-names>ID</given-names></name> <name><surname>Sun</surname> <given-names>Y</given-names></name></person-group>. <article-title>A survey of ensemble learning: concepts, algorithms, applications, and prospects.</article-title> <source><italic>IEEE Access.</italic></source> (<year>2022</year>) <volume>10</volume>:<fpage>99129</fpage>&#x2013;<lpage>49</lpage>. <pub-id pub-id-type="doi">10.1109/ACCESS.2022.3207287</pub-id></citation></ref>
<ref id="B34"><label>34.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schonlau</surname> <given-names>M</given-names></name> <name><surname>Zou</surname> <given-names>RY</given-names></name></person-group>. <article-title>The random forest algorithm for statistical learning.</article-title> <source><italic>Stata J.</italic></source> (<year>2020</year>) <volume>20</volume>:<fpage>29</fpage>&#x2013;<lpage>33</lpage>. <pub-id pub-id-type="doi">10.1177/1536867X20909688</pub-id></citation></ref>
<ref id="B35"><label>35.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yagin</surname> <given-names>B</given-names></name> <name><surname>Yagin</surname> <given-names>F</given-names></name> <name><surname>Colak</surname> <given-names>C</given-names></name> <name><surname>Inceoglu</surname> <given-names>F</given-names></name> <name><surname>Kadry</surname> <given-names>S</given-names></name> <name><surname>Kim</surname> <given-names>J</given-names></name></person-group>. <article-title>Cancer metastasis prediction and genomic biomarker identification through machine learning and eXplainable artificial intelligence in breast cancer research.</article-title> <source><italic>Diagnostics.</italic></source> (<year>2023</year>) <volume>13</volume>:<fpage>3314</fpage>. <pub-id pub-id-type="doi">10.3390/diagnostics13213314</pub-id> <pub-id pub-id-type="pmid">37958210</pub-id></citation></ref>
<ref id="B36"><label>36.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bent&#x00E9;jac</surname> <given-names>C</given-names></name> <name><surname>Cs&#x00F6;rgo</surname> <given-names>A</given-names></name> <name><surname>Mart&#x00ED;nez-Mu&#x00F1;oz</surname> <given-names>G</given-names></name></person-group>. <article-title>A comparative analysis of gradient boosting algorithms.</article-title> <source><italic>Artif Intell Rev.</italic></source> (<year>2019</year>) <volume>54</volume>:<fpage>1937</fpage>&#x2013;<lpage>67</lpage>. <pub-id pub-id-type="doi">10.1007/s10462-020-09896-5</pub-id></citation></ref>
<ref id="B37"><label>37.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Iwendi</surname> <given-names>C</given-names></name> <name><surname>Bashir</surname> <given-names>A</given-names></name> <name><surname>Peshkar</surname> <given-names>A</given-names></name> <name><surname>Sujatha</surname> <given-names>R</given-names></name> <name><surname>Chatterjee</surname> <given-names>J</given-names></name> <name><surname>Pasupuleti</surname> <given-names>S</given-names></name><etal/></person-group> <article-title>COVID-19 patient health prediction using boosted random forest algorithm.</article-title> <source><italic>Front Public Health.</italic></source> (<year>2020</year>) <volume>8</volume>:<fpage>357</fpage>. <pub-id pub-id-type="doi">10.3389/fpubh.2020.00357</pub-id> <pub-id pub-id-type="pmid">32719767</pub-id></citation></ref>
<ref id="B38"><label>38.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sherazi</surname> <given-names>S</given-names></name> <name><surname>Bae</surname> <given-names>J</given-names></name> <name><surname>Lee</surname> <given-names>JY</given-names></name></person-group>. <article-title>A soft voting ensemble classifier for early prediction and diagnosis of occurrences of major adverse cardiovascular events for STEMI and NSTEMI during 2-year follow-up in patients with acute coronary syndrome.</article-title> <source><italic>PLoS One.</italic></source> (<year>2021</year>) <volume>16</volume>:<fpage>e0249338</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0249338</pub-id> <pub-id pub-id-type="pmid">34115750</pub-id></citation></ref>
<ref id="B39"><label>39.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moreno-Seco</surname> <given-names>F</given-names></name> <name><surname>I&#x00F1;esta</surname> <given-names>JM</given-names></name> <name><surname>Ponce de Le&#x00F3;n</surname> <given-names>PJ</given-names></name> <name><surname>Mic&#x00F3;</surname> <given-names>L.</given-names></name></person-group> <source><italic>Comparison of Classifier Fusion Methods for Classification in Pattern Recognition Tasks: Structural, Syntactic, and Statistical Pattern Recognition.</italic></source> <publisher-loc>Berlin, Heidelberg</publisher-loc>: <publisher-name>Springer Berlin Heidelberg</publisher-name> (<year>2006</year>).</citation></ref>
<ref id="B40"><label>40.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Khan</surname> <given-names>A</given-names></name> <name><surname>Sohail</surname> <given-names>A</given-names></name> <name><surname>Zahoora</surname> <given-names>U</given-names></name></person-group>. <article-title>A survey of the recent architectures of deep convolutional neural networks.</article-title> <source><italic>Artif Intell Rev.</italic></source> (<year>2019</year>) <volume>53</volume>:<fpage>5455</fpage>&#x2013;<lpage>516</lpage>. <pub-id pub-id-type="doi">10.1007/s10462-020-09825-6</pub-id></citation></ref>
<ref id="B41"><label>41.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jia</surname> <given-names>D</given-names></name> <name><surname>Li</surname> <given-names>Z</given-names></name> <name><surname>Zhang</surname> <given-names>C</given-names></name></person-group>. <article-title>Detection of cervical cancer cells based on strong feature CNN-SVM network.</article-title> <source><italic>Neurocomputing.</italic></source> (<year>2020</year>) <volume>411</volume>:<fpage>112</fpage>&#x2013;<lpage>27</lpage>. <pub-id pub-id-type="doi">10.1016/j.neucom.2020.06.006</pub-id></citation></ref>
<ref id="B42"><label>42.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rainio</surname> <given-names>O</given-names></name> <name><surname>Teuho</surname> <given-names>J</given-names></name> <name><surname>Kl&#x00E9;n</surname> <given-names>R</given-names></name></person-group>. <article-title>Evaluation metrics and statistical tests for machine learning.</article-title> <source><italic>Sci Rep.</italic></source> (<year>2024</year>) <volume>14</volume>:<fpage>6086</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-024-56706-x</pub-id> <pub-id pub-id-type="pmid">38480847</pub-id></citation></ref>
<ref id="B43"><label>43.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhu</surname> <given-names>Q</given-names></name></person-group>. <article-title>On the performance of Matthews correlation coefficient (MCC) for imbalanced dataset.</article-title> <source><italic>Pattern Recognit Lett.</italic></source> (<year>2020</year>) <volume>136</volume>:<fpage>71</fpage>&#x2013;<lpage>80</lpage>. <pub-id pub-id-type="doi">10.1016/j.patrec.2020.03.030</pub-id></citation></ref>
<ref id="B44"><label>44.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Itaya</surname> <given-names>Y</given-names></name> <name><surname>Tamura</surname> <given-names>J</given-names></name> <name><surname>Hayashi</surname> <given-names>K</given-names></name> <name><surname>Yamamoto</surname> <given-names>K</given-names></name></person-group>. <article-title>Asymptotic properties of matthews correlation coefficient.</article-title> <source><italic>Stat Med.</italic></source> (<year>2025</year>) <volume>44</volume>:<fpage>e10303</fpage>. <pub-id pub-id-type="doi">10.1002/sim.10303</pub-id> <pub-id pub-id-type="pmid">39682035</pub-id></citation></ref>
<ref id="B45"><label>45.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Satyanarayana Raju</surname> <given-names>P</given-names></name> <name><surname>Pyda Vijaya Radhika</surname> <given-names>CH</given-names></name> <name><surname>Srinivas</surname> <given-names>BS</given-names></name> <name><surname>Vaish</surname> <given-names>R</given-names></name> <name><surname>Usha Rani</surname> <given-names>P</given-names></name></person-group>. <article-title>Assessing the impact of body mass index on insulin resistance and metabolic risk factors in pre-diabetic individuals: a comprehensive cross-sectional study.</article-title> <source><italic>Asian J Med Sci.</italic></source> (<year>2024</year>) <volume>15</volume>:<fpage>77</fpage>&#x2013;<lpage>81</lpage>. <pub-id pub-id-type="doi">10.3126/ajms.v15i5.62793</pub-id></citation></ref>
<ref id="B46"><label>46.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maniyara</surname> <given-names>K</given-names></name> <name><surname>Kodali</surname> <given-names>P</given-names></name></person-group>. <article-title>Assessing type-2 diabetes risk based on the Indian diabetes risk score among adults aged 45 and above in India.</article-title> <source><italic>Sci Rep.</italic></source> (<year>2025</year>) <volume>15</volume>:<fpage>4495</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-025-88460-z</pub-id> <pub-id pub-id-type="pmid">39915651</pub-id></citation></ref>
<ref id="B47"><label>47.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hezam</surname> <given-names>A</given-names></name> <name><surname>Shaghdar</surname> <given-names>H</given-names></name> <name><surname>Chen</surname> <given-names>L</given-names></name></person-group>. <article-title>The connection between hypertension and diabetes and their role in heart and kidney disease development.</article-title> <source><italic>J Res Med Sci.</italic></source> (<year>2024</year>) <volume>29</volume>:<fpage>22</fpage>. <pub-id pub-id-type="doi">10.4103/jrms.jrms_470_23</pub-id> <pub-id pub-id-type="pmid">38855561</pub-id></citation></ref>
<ref id="B48"><label>48.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kumar</surname> <given-names>P</given-names></name> <name><surname>Kumar</surname> <given-names>A</given-names></name> <name><surname>Raj</surname> <given-names>R</given-names></name></person-group>. <article-title>Comparative study: correlation of urea and serum creatinine with duration of diabetes and glycemic index in individuals with type 1 and 2 diabetes mellitus.</article-title> <source><italic>Students J Health Res Afr.</italic></source> (<year>2023</year>) <volume>4</volume>:<fpage>6</fpage>. <pub-id pub-id-type="doi">10.51168/sjhrafrica.v4i12.830</pub-id></citation></ref>
<ref id="B49"><label>49.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bonet</surname> <given-names>J</given-names></name> <name><surname>Yadav</surname> <given-names>Y</given-names></name> <name><surname>Miles</surname> <given-names>J</given-names></name> <name><surname>Basu</surname> <given-names>A</given-names></name> <name><surname>Cobelli</surname> <given-names>C</given-names></name> <name><surname>Basu</surname> <given-names>R</given-names></name><etal/></person-group> <article-title>A new oral model of free fatty acid kinetics to assess lipolysis in subjects with and without type 2 diabetes.</article-title> <source><italic>Am J Physiol Endocrinol Metab.</italic></source> (<year>2023</year>) <volume>325</volume>:<fpage>E163</fpage>&#x2013;<lpage>70</lpage>. <pub-id pub-id-type="doi">10.1152/ajpendo.00091.2023</pub-id> <pub-id pub-id-type="pmid">37378622</pub-id></citation></ref>
<ref id="B50"><label>50.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Levita</surname> <given-names>J</given-names></name> <name><surname>Sumiwi</surname> <given-names>S</given-names></name> <name><surname>Elkanawati</surname> <given-names>R</given-names></name></person-group>. <article-title>Impact of lipids on insulin resistance: insights from human and animal studies.</article-title> <source><italic>Drug Design Dev Ther.</italic></source> (<year>2024</year>) <volume>18</volume>:<fpage>3337</fpage>&#x2013;<lpage>60</lpage>. <pub-id pub-id-type="doi">10.2147/DDDT.S468147</pub-id> <pub-id pub-id-type="pmid">39100221</pub-id></citation></ref>
<ref id="B51"><label>51.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dumont</surname> <given-names>B</given-names></name> <name><surname>Neagoe</surname> <given-names>P</given-names></name> <name><surname>Charles</surname> <given-names>E</given-names></name> <name><surname>Villeneuve</surname> <given-names>L</given-names></name> <name><surname>Tardif</surname> <given-names>J</given-names></name> <name><surname>R&#x00E4;kel</surname> <given-names>A</given-names></name><etal/></person-group> <article-title>Low-density neutrophils contribute to subclinical inflammation in patients with type 2 diabetes.</article-title> <source><italic>Int J Mol Sci.</italic></source> (<year>2024</year>) <volume>25</volume>:<fpage>1674</fpage>. <pub-id pub-id-type="doi">10.3390/ijms25031674</pub-id> <pub-id pub-id-type="pmid">38338951</pub-id></citation></ref>
<ref id="B52"><label>52.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nigi</surname> <given-names>L</given-names></name> <name><surname>Pedace</surname> <given-names>E</given-names></name> <name><surname>Dotta</surname> <given-names>F</given-names></name> <name><surname>Sebastiani</surname> <given-names>G</given-names></name></person-group>. <article-title>Neutrophils in type 1 diabetes: untangling the intricate web of pathways and hypothesis.</article-title> <source><italic>Biomolecules.</italic></source> (<year>2025</year>) <volume>15</volume>:<fpage>505</fpage>. <pub-id pub-id-type="doi">10.3390/biom15040505</pub-id> <pub-id pub-id-type="pmid">40305198</pub-id></citation></ref>
<ref id="B53"><label>53.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H</given-names></name> <name><surname>Xu</surname> <given-names>Y</given-names></name> <name><surname>Fan</surname> <given-names>S</given-names></name> <name><surname>Wang</surname> <given-names>Z</given-names></name> <name><surname>Chen</surname> <given-names>H</given-names></name> <name><surname>Zhang</surname> <given-names>L</given-names></name><etal/></person-group> <article-title>Association between neutrophil-percentage-to-albumin ratio and diabetic kidney disease in type 2 diabetes mellitus patients: a cross-sectional study from NHANES 2009-2018.</article-title> <source><italic>Front Endocrinol.</italic></source> (<year>2025</year>) <volume>16</volume>:<fpage>1552772</fpage>. <pub-id pub-id-type="doi">10.3389/fendo.2025.1552772</pub-id> <pub-id pub-id-type="pmid">40115740</pub-id></citation></ref>
<ref id="B54"><label>54.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Floyd</surname> <given-names>J</given-names></name> <name><surname>Prasad</surname> <given-names>R</given-names></name> <name><surname>Dupont</surname> <given-names>M</given-names></name> <name><surname>Adu-Rutledge</surname> <given-names>Y</given-names></name> <name><surname>Anshumali</surname> <given-names>S</given-names></name> <name><surname>Paul</surname> <given-names>S</given-names></name><etal/></person-group> <article-title>Intestinal neutrophil extracellular traps promote gut barrier damage exacerbating endotoxaemia, systemic inflammation and progression of diabetic retinopathy in type 2 diabetes.</article-title> <source><italic>Diabetologia.</italic></source> (<year>2025</year>) <volume>68</volume>:<fpage>866</fpage>&#x2013;<lpage>89</lpage>. <pub-id pub-id-type="doi">10.1007/s00125-024-06349-4</pub-id> <pub-id pub-id-type="pmid">39875729</pub-id></citation></ref>
<ref id="B55"><label>55.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Siddiqui</surname> <given-names>N</given-names></name> <name><surname>Narang</surname> <given-names>S</given-names></name> <name><surname>Aggarwal</surname> <given-names>A</given-names></name> <name><surname>Gupta</surname> <given-names>R</given-names></name> <name><surname>Goel</surname> <given-names>V</given-names></name></person-group>. <article-title>Immature platelet fraction and other platelet indices in type 2 diabetes mellitus.</article-title> <source><italic>Cureus.</italic></source> (<year>2025</year>) <volume>17</volume>:<fpage>e79093</fpage>. <pub-id pub-id-type="doi">10.7759/cureus.79093</pub-id> <pub-id pub-id-type="pmid">40104479</pub-id></citation></ref>
<ref id="B56"><label>56.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jena</surname> <given-names>S</given-names></name> <name><surname>Raizada</surname> <given-names>N</given-names></name> <name><surname>Kalra</surname> <given-names>S</given-names></name> <name><surname>Bhattacharya</surname> <given-names>S</given-names></name></person-group>. <article-title>Platelet indices as predictors of glycaemic status and complications in diabetes mellitus.</article-title> <source><italic>Apollo Med.</italic></source> (<year>2025</year>) <volume>22</volume>:<fpage>214</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1177/09760016251317265</pub-id></citation></ref>
<ref id="B57"><label>57.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chaudhary</surname> <given-names>S</given-names></name> <name><surname>Kausar</surname> <given-names>Z</given-names></name> <name><surname>Khan</surname> <given-names>R</given-names></name> <name><surname>Farhan</surname> <given-names>E</given-names></name></person-group>. <article-title>Association of plateletcrit value with gestational diabetes mellitus: a case control study in a tertiary care setting.</article-title> <source><italic>Pak J Health Sci.</italic></source> (<year>2025</year>) <volume>6</volume>:<fpage>228</fpage>&#x2013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.54393/pjhs.v6i1.2655</pub-id></citation></ref>
<ref id="B58"><label>58.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Peng</surname> <given-names>Y</given-names></name> <name><surname>Yin</surname> <given-names>H</given-names></name> <name><surname>Hu</surname> <given-names>L</given-names></name> <name><surname>Fang</surname> <given-names>L</given-names></name> <name><surname>Jia</surname> <given-names>D</given-names></name> <name><surname>Li</surname> <given-names>L</given-names></name></person-group>. <article-title>White blood cell count is associated with hyperuricemia in patients with type 2 diabetes mellitus.</article-title> <source><italic>J Inflamm Res.</italic></source> (<year>2025</year>) <volume>18</volume>:<fpage>3993</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.2147/JIR.S501890</pub-id> <pub-id pub-id-type="pmid">40125090</pub-id></citation></ref>
<ref id="B59"><label>59.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aghaei</surname> <given-names>M</given-names></name> <name><surname>Bahreiny</surname> <given-names>S</given-names></name> <name><surname>Zayeri</surname> <given-names>Z</given-names></name> <name><surname>Davari</surname> <given-names>N</given-names></name> <name><surname>Abolhasani</surname> <given-names>M</given-names></name> <name><surname>Saki</surname> <given-names>N</given-names></name></person-group>. <article-title>Evaluation of complete blood count parameters in patients with diabetes mellitus: a systematic review.</article-title> <source><italic>Health Sci Rep.</italic></source> (<year>2025</year>) <volume>8</volume>:<fpage>e70488</fpage>. <pub-id pub-id-type="doi">10.1002/hsr2.70488</pub-id> <pub-id pub-id-type="pmid">39995796</pub-id></citation></ref>
</ref-list>
</back>
</article>