<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Public Health</journal-id>
<journal-title>Frontiers in Public Health</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Public Health</abbrev-journal-title>
<issn pub-type="epub">2296-2565</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpubh.2025.1509458</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Public Health</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>The relationship between epigenetic biomarkers and the risk of diabetes and cancer: a machine learning modeling approach</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Zhang</surname> <given-names>Shiqi</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn0001"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2989986/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes" equal-contrib="yes">
<name><surname>Jin</surname> <given-names>Jianan</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<xref ref-type="author-notes" rid="fn0001"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2665507/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Xu</surname> <given-names>Benfeng</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn0001"><sup>&#x2020;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Zheng</surname> <given-names>Qi</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2585571/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Mou</surname> <given-names>Haibo</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2671784/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Department of Oncology, Shulan (Hangzhou) Hospital, Affiliated to Zhejiang Shuren University Shulan International Medical College</institution>, <addr-line>Hangzhou, Zhejiang</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Graduate School, Zhejiang Chinese Medical University</institution>, <addr-line>Hangzhou, Zhejiang</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>State Key Laboratory for Diagnosis and Treatment of Infectious Diseases, National Clinical Research Center for Infectious Diseases, National Medical Center for Infectious Diseases, Collaborative Innovation Center for Diagnosis and Treatment of Infectious Diseases, The First Affiliated Hospital, Zhejiang University School of Medicine</institution>, <addr-line>Hangzhou</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by" id="fn0002">
<p>Edited by: Lai Xuefeng, Huazhong University of Science and Technology, China</p>
</fn>
<fn fn-type="edited-by" id="fn0003">
<p>Reviewed by: Giovanni Fiorito, IRCCS Giannina Gaslini Institute, Italy</p>
<p>Yi Zhe Wang, University of Michigan, United States</p>
</fn>
<corresp id="c001">&#x002A;Correspondence: Jianan Jin, <email>xzugfbmapf@outlook.com</email>; Haibo Mou, <email>haibo.mou@shulan.com</email></corresp>
<fn fn-type="equal" id="fn0001"><p><sup>&#x2020;</sup>These authors have contributed equally to this work and share first authorship</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>21</day>
<month>03</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>13</volume>
<elocation-id>1509458</elocation-id>
<history>
<date date-type="received">
<day>11</day>
<month>10</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>24</day>
<month>02</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2025 Zhang, Jin, Xu, Zheng and Mou.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Zhang, Jin, Xu, Zheng and Mou</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec id="sec1">
<title>Introduction</title>
<p>Epigenetic biomarkers are molecular indicators of epigenetic changes, and some studies have suggested that these biomarkers have predictive power for disease risk. This study aims to analyze the relationship between 30 epigenetic biomarkers and the risk of diabetes and cancer using machine learning modeling.</p>
</sec>
<sec id="sec2">
<title>Methods</title>
<p>The data for this study were sourced from the NHANES database, which includes DNA methylation arrays and epigenetic biomarker datasets. Nine machine learning algorithms were used to build models: AdaBoost, GBM, KNN, lightGBM, MLP, RF, SVM, XGBoost, and logistics. Model stability was evaluated using metrics such as Accuracy, MCC, and Sensitivity. The performance and decision-making ability of the models were displayed using ROC curves and DCA curves, while SHAP values were used to visualize the importance of each epigenetic biomarker.</p>
</sec>
<sec id="sec3">
<title>Results</title>
<p>Epigenetic age acceleration was strongly associated with cancer risk but had a weaker relationship with diabetes. In the diabetes model, the top three contributing features were logA1Mort, family income-to-poverty ratio, and marital status. In the cancer model, the top three contributing features were gender, non-Hispanic White ethnicity, and PACKYRSMort.</p>
</sec>
<sec id="sec4">
<title>Conclusion</title>
<p>Our study identified the relationship between epigenetic biomarkers and the risk of diabetes and cancer, and used machine learning techniques to analyze the contributions of various epigenetic biomarkers to disease risk.</p>
</sec>
</abstract>
<kwd-group>
<kwd>epigenetic biomarkers</kwd>
<kwd>epigenetic clocks</kwd>
<kwd>epigenetic age acceleration</kwd>
<kwd>diabetes</kwd>
<kwd>cancer</kwd>
<kwd>machine learning</kwd>
</kwd-group>
<counts>
<fig-count count="11"/>
<table-count count="7"/>
<equation-count count="0"/>
<ref-count count="54"/>
<page-count count="20"/>
<word-count count="10220"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Aging and Public Health</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec5">
<label>1</label>
<title>Introduction</title>
<p>Diabetes and cancer are major challenges in the field of global public health, with the incidence of these diseases continuing to rise (<xref ref-type="bibr" rid="ref1 ref2 ref3">1&#x2013;3</xref>), making it urgent to develop effective early detection signals and risk prediction tools.</p>
<p>Epigenetic biomarkers, particularly DNA methylation, are an important direction for studying the mechanisms underlying these diseases. DNA methylation is a process in which methyl groups are added to DNA, leading to changes in gene function, such as the silencing of tumor suppressor genes, activation of oncogenes, and abnormalities in promoter regions (<xref ref-type="bibr" rid="ref4 ref5 ref6 ref7">4&#x2013;7</xref>). These changes are closely linked to the development of various chronic diseases (<xref ref-type="bibr" rid="ref8 ref9 ref10">8&#x2013;10</xref>). However, existing studies have mostly been limited to a small number of epigenetic biomarkers and lack in-depth exploration of the specific relationships between these biomarkers and diseases in different contexts. Epigenetic age clocks are constructed based on specific DNA methylation sites (CpG sites) and can accurately predict an individual&#x2019;s &#x201C;biological age,&#x201D; which refers to the degree of aging of the body compared to its chronological age. By measuring different DNA methylation patterns, researchers have found that epigenetic age is not only highly correlated with chronological age (<xref ref-type="bibr" rid="ref11">11</xref>), but its acceleration (the difference between epigenetic age and chronological age) is considered a potential biomarker for aging and various diseases (<xref ref-type="bibr" rid="ref12">12</xref>). For example, accelerated epigenetic age has been found to be closely associated with several age-related diseases, such as diabetes, cancer, cardiovascular diseases, and others (<xref ref-type="bibr" rid="ref8">8</xref>, <xref ref-type="bibr" rid="ref13">13</xref>, <xref ref-type="bibr" rid="ref14">14</xref>).</p>
<p>In this study, we present 30 epigenetic biomarkers that have shown potential associations with diabetes and cancer in research across multiple fields. We expanded the selection scope and considered the biological significance of these biomarkers in the context of various diseases. These include epigenetic clocks (such as HorvathAge, LinAge, PhenoAge, WeidnerAge, etc.), lifespan and mortality-related biomarkers (such as GrimAgeMort, ADMMort, B2MMort, GDF15Mort, etc.), immune system biomarkers (such as CRPMor, CD8TPP, CD4TPP, NKcel, Bcell, etc.), and metabolism-related biomarkers (such as logA1CMort, LeptinMort, PACKYRSMort), which fall into three major categories of epigenetic material. For example, biomarkers like HorvathAge and GrimAge are closely associated with the aging process and the onset of various chronic diseases. LinAge, a biomarker associated with an individual&#x2019;s age, has demonstrated a strong correlation with biological aging (<xref ref-type="bibr" rid="ref15">15</xref>). Meanwhile, biomarkers such as LeptinMort and PACKYRSMort, which are linked to metabolic processes, smoking behaviors, and nutrition, have been confirmed in multiple studies to be associated with an increased risk of diabetes (<xref ref-type="bibr" rid="ref16">16</xref>, <xref ref-type="bibr" rid="ref17">17</xref>). Additionally, GDF15Mort is related to age-associated mitochondrial dysfunction (<xref ref-type="bibr" rid="ref18">18</xref>). Therefore, selecting these biomarkers as the focus of this study aims to explore their predictive ability and underlying mechanisms in diabetes and cancer.</p>
<p>Machine learning (ML), as an emerging artificial intelligence technology, offers advantages over traditional statistical analyses, such as higher predictive accuracy and the ability to maintain high prediction performance even with missing data. It is capable of making accurate predictions by utilizing data from various sources. The application of machine learning techniques in the medical field for disease diagnosis and prediction can significantly contribute to disease prevention and treatment (<xref ref-type="bibr" rid="ref19">19</xref>, <xref ref-type="bibr" rid="ref20">20</xref>). In recent years, machine learning has been applied across various fields of clinical disease diagnosis. For example, studies have widely applied machine learning algorithms in the monitoring of tumors and cardiovascular diseases (<xref ref-type="bibr" rid="ref21">21</xref>). Other research has used machine learning to analyze regularly collected electronic health record data and construct predictive models for the progression from prediabetes to type 2 diabetes (<xref ref-type="bibr" rid="ref22">22</xref>).</p>
<p>The core objective of this study is to explore the relationship between different epigenetic age clocks and diabetes and cancer, analyzing the potential role of accelerated epigenetic age in these diseases. Secondly, machine learning techniques were used to construct risk assessment models for diabetes and cancer based on epigenetic biomarkers, and their predictive effectiveness in clinical settings was validated. Lastly, by combining clinical features with epigenetic biomarkers, the study aims to optimize risk prediction models, providing a basis for early disease screening and personalized intervention. Nine machine learning algorithms were selected to build the models, and model evaluations and comparisons were conducted to identify the best model for predicting cancer and diabetes risks. Thirty epigenetic biomarkers were used to predict the risk of diabetes and cancer and visualized for analysis. The goal is to assess the value of each epigenetic biomarker in predicting the occurrence of diabetes and cancer, especially in the early screening and prediction of these diseases. Epigenetics will undoubtedly help unravel more mysteries about aging and its associated diseases, offering strong support for the implementation of precision medicine.</p>
</sec>
<sec sec-type="methods" id="sec6">
<label>2</label>
<title>Methods</title>
<sec id="sec7">
<label>2.1</label>
<title>Data sources and study population</title>
<p>The epigenetic biomarker data in this study are based on the DNA methylation array and epigenetic biomarker datasets from the NHANES database, an epidemiological survey program conducted by the National Center for Health Statistics (NCHS) at the Centers for Disease Control and Prevention (CDC) in the United States. DNA methylation array and epigenetic biomarker data were obtained from blood samples of participants. DNA was extracted from the samples and DNA methylation measurements were performed using the Illumina MethylationEPIC BeadChip. The methylation data were processed, preprocessed, and normalized to generate the epigenetic biomarker data (<xref ref-type="table" rid="tab1">Table 1</xref>) (NHANES website). Sex, age, race, education level, marital status, household income, and poverty ratio were obtained from participant questionnaires and physical measurement datasets. Questionnaire data were collected using standardized questionnaires, and physical measurements were conducted at specially designed and equipped mobile centers.</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Biomarkers of aging.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Variable</th>
<th align="left" valign="top">Role</th>
<th align="left" valign="top">Source</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">HorvathAge (PMID: 24138928)</td>
<td align="left" valign="middle">Estimated chronological age</td>
<td align="left" valign="middle">51 tissues</td>
</tr>
<tr>
<td align="left" valign="middle">HannumAge (PMID: 23177740)</td>
<td align="left" valign="middle">Estimated chronological age</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">SkinBloodAge (PMID: 30048243)</td>
<td align="left" valign="middle">Estimated chronological age</td>
<td align="left" valign="middle">Skin and blood derived tissues</td>
</tr>
<tr>
<td align="left" valign="middle">PhenoAge (PMID: 29676998)</td>
<td align="left" valign="middle">Estimated chronological age</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">LinAge (PMID: 26928272)</td>
<td align="left" valign="middle">Estimated chronological age</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">WeidnerAge (PMID: 24490752)</td>
<td align="left" valign="middle">Estimated chronological age</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">VidalBraloAge (PMID: 27471517)</td>
<td align="left" valign="middle">Estimated chronological age</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">YangCell (PMID: 27716309)</td>
<td align="left" valign="middle">Forecasted mitotic cell division</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">ZhangAge (PMID: 31443728)</td>
<td align="left" valign="middle">Estimated chronological age</td>
<td align="left" valign="middle">Whole blood and saliva</td>
</tr>
<tr>
<td align="left" valign="middle">GrimAgeMort (PMID: 30669119)</td>
<td align="left" valign="middle">Estimated mortality</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">GrimAge2Mort (PMID: 36516495)</td>
<td align="left" valign="middle">Estimated mortality</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">DunedinPoAm (PMID: 32367804)</td>
<td align="left" valign="middle">predicted pace of aging</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">HorvathTelo (PMID: 31422385)</td>
<td align="left" valign="middle">Estimated telomere length</td>
<td align="left" valign="middle">Leukocytes</td>
</tr>
<tr>
<td align="left" valign="middle">ADMMort (PMID: 30669119)</td>
<td align="left" valign="middle">Predicted adrenomedullin</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">B2MMort (PMID: 30669119)</td>
<td align="left" valign="middle">Predicted beta-2 microglobulin</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">CystatinCMort1 (PMID: 30669119)</td>
<td align="left" valign="middle">predicted cystatin C</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">GDF15Mort (PMID: 30669119)</td>
<td align="left" valign="middle">Predicted Beta-2 growth differentiation factor 15 u</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">LeptinMort (PMID: 30669119)</td>
<td align="left" valign="middle">Predicted leptin</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">logA1CMort (PMID: 36516495)</td>
<td align="left" valign="middle">Expected hemoglobin A1c</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">CRPMort (PMID: 36516495)</td>
<td align="left" valign="middle">Predicted high sensitivity C-reactive protein</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">PACKYRSMort (PMID: 30669119)</td>
<td align="left" valign="middle">Predicted pack years of smoking</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">PAI1Mort (PMID: 30669119)</td>
<td align="left" valign="middle">Predicted plasminogen activation inhibitor</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">TIMP1Mort (PMID: 30669119)</td>
<td align="left" valign="middle">predicted tissue inhibitor metalloproteinase 1</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">CD8TPP (PMID: 23903776, PMID: 29843789, PMID: 26956433)</td>
<td align="left" valign="middle">Predicted CD8+ T-cell proportion</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">CD4TPP (PMID: 23903776, PMID: 29843789, PMID: 26956433)</td>
<td align="left" valign="middle">Predicted CD4+ T-cell proportion</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">NKcel (PMID: 23903776, PMID: 29843789, PMID: 26956433)</td>
<td align="left" valign="middle">Predicted natural killer cell proportion</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">Bcell (PMID: 23903776, PMID: 29843789, PMID: 26956433)</td>
<td align="left" valign="middle">Predicted B-cell proportion</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">MonoPP2 (PMID: 23903776, PMID: 29843789, PMID: 26956433)</td>
<td align="left" valign="middle">Predicted monocyte proportion</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
<tr>
<td align="left" valign="middle">NeuPP (PMID: 23903776, PMID: 29843789, PMID: 26956433)</td>
<td align="left" valign="middle">Predicted neutrophil proportion</td>
<td align="left" valign="middle">Whole blood</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>In our study, race was categorized based on the questionnaire responses into five groups: Mexican American, non-Hispanic White, non-Hispanic Black, other Hispanic, and other races, with values assigned from 1 to 5. Education level was classified as high school or higher vs. less than high school. Marital status was categorized as married, cohabiting, or unmarried/not living with a partner. Household income and poverty ratio were divided into &#x2265;300 and &#x003C;300%, and BMI was categorized as &#x2265;24 and &#x003C;24.</p>
</sec>
<sec id="sec8">
<label>2.2</label>
<title>Statistical analysis</title>
<p>Descriptive statistical analyses were performed using R software (version 4.4.1) (<xref ref-type="table" rid="tab2">Tables 2</xref>, <xref ref-type="table" rid="tab3">3</xref>). For normally distributed continuous variables, means and standard deviations were reported, while for non-normally distributed continuous variables, medians and interquartile ranges were reported. Categorical variables were presented as percentages. Continuous variables were analyzed using t-tests or Mann&#x2013;Whitney U tests, while categorical variables were analyzed using chi-square tests or Fisher&#x2019;s exact tests.</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>Cancer baseline table.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" rowspan="2">Variable</th>
<th align="center" valign="top">Non-tumor patients</th>
<th align="center" valign="top">Tumor patients</th>
<th align="center" valign="top" rowspan="2"><italic>p</italic> Overall</th>
</tr>
<tr>
<th align="center" valign="top"><italic>N</italic>&#x202F;=&#x202F;1,083</th>
<th align="center" valign="top"><italic>N</italic>&#x202F;=&#x202F;174</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Sex:</td>
<td/>
<td/>
<td align="center" valign="middle">0.627</td>
</tr>
<tr>
<td align="left" valign="middle">Female</td>
<td align="center" valign="middle">523 (48.3%)</td>
<td align="center" valign="middle">80 (46.0%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Male</td>
<td align="center" valign="middle">560 (51.7%)</td>
<td align="center" valign="middle">94 (54.0%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Age</td>
<td align="center" valign="middle">63.8 (9.69)</td>
<td align="center" valign="middle">69.1 (10.00)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Race:</td>
<td/>
<td/>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Mexican</td>
<td align="center" valign="middle">272 (25.1%)</td>
<td align="center" valign="middle">23 (13.2%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Non-Hispanic whites</td>
<td align="center" valign="middle">63 (5.8%)</td>
<td align="center" valign="middle">6 (3.4%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Non-Hispanic blacks</td>
<td align="center" valign="middle">459 (42.4%)</td>
<td align="center" valign="middle">119 (68.4%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Other Hispanics</td>
<td align="center" valign="middle">249 (23.0%)</td>
<td align="center" valign="middle">25 (14.4%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Other Ethnic Groups</td>
<td align="center" valign="middle">40 (3.7%)</td>
<td align="center" valign="middle">1 (0.6%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Edu:</td>
<td/>
<td/>
<td align="center" valign="middle">0.039</td>
</tr>
<tr>
<td align="left" valign="middle">High school and above</td>
<td align="center" valign="middle">857 (79.1%)</td>
<td align="center" valign="middle">150 (86.2%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Below high school</td>
<td align="center" valign="middle">226 (20.9%)</td>
<td align="center" valign="middle">24 (13.8%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Marry:</td>
<td/>
<td/>
<td align="center" valign="middle">1.000</td>
</tr>
<tr>
<td align="left" valign="middle">Get married</td>
<td align="center" valign="middle">734 (67.8%)</td>
<td align="center" valign="middle">118 (67.8%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Unmarried</td>
<td align="center" valign="middle">349 (32.2%)</td>
<td align="center" valign="middle">56 (32.2%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Hypertension:</td>
<td/>
<td/>
<td align="center" valign="middle">0.053</td>
</tr>
<tr>
<td align="left" valign="middle">Didn&#x2019;t happened</td>
<td align="center" valign="middle">587 (54.2%)</td>
<td align="center" valign="middle">80 (46.0%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Exist</td>
<td align="center" valign="middle">496 (45.8%)</td>
<td align="center" valign="middle">94 (54.0%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Diabetes:</td>
<td/>
<td/>
<td align="center" valign="middle">0.278</td>
</tr>
<tr>
<td align="left" valign="middle">Didn&#x2019;t happened</td>
<td align="center" valign="middle">894 (82.5%)</td>
<td align="center" valign="middle">150 (86.2%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Exist</td>
<td align="center" valign="middle">189 (17.5%)</td>
<td align="center" valign="middle">24 (13.8%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">HorvathAge</td>
<td align="center" valign="middle">65.2 (8.84)</td>
<td align="center" valign="middle">70.3 (9.81)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">HannumAge</td>
<td align="center" valign="middle">64.8 (9.31)</td>
<td align="center" valign="middle">70.2 (9.80)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">SkinBloodAge</td>
<td align="center" valign="middle">62.4 (9.27)</td>
<td align="center" valign="middle">67.4 (9.74)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">PhenoAge</td>
<td align="center" valign="middle">53.3 (10.2)</td>
<td align="center" valign="middle">58.9 (11.0)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">ZhangAge</td>
<td align="center" valign="middle">65.9 (3.62)</td>
<td align="center" valign="middle">68.0 (3.82)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">LinAge</td>
<td align="center" valign="middle">55.3 (11.5)</td>
<td align="center" valign="middle">61.7 (13.3)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">WeidnerAge</td>
<td align="center" valign="middle">53.5 (10.2)</td>
<td align="center" valign="middle">56.9 (11.8)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">VidalBraloAge</td>
<td align="center" valign="middle">59.2 (6.27)</td>
<td align="center" valign="middle">63.0 (7.58)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">HorvathAge acceleration</td>
<td align="center" valign="middle">1.40 (5.32)</td>
<td align="center" valign="middle">1.24 (6.14)</td>
<td align="center" valign="middle">0.755</td>
</tr>
<tr>
<td align="left" valign="middle">HannumAge acceleration</td>
<td align="center" valign="middle">0.98 (5.14)</td>
<td align="center" valign="middle">1.11 (5.64)</td>
<td align="center" valign="middle">0.779</td>
</tr>
<tr>
<td align="left" valign="middle">SkinBloodAge acceleration</td>
<td align="center" valign="middle">&#x2212;1.40 (4.12)</td>
<td align="center" valign="middle">&#x2212;1.64 (4.90)</td>
<td align="center" valign="middle">0.526</td>
</tr>
<tr>
<td align="left" valign="middle">PhenoAge acceleration</td>
<td align="center" valign="middle">&#x2212;10.45 (6.33)</td>
<td align="center" valign="middle">&#x2212;10.18 (6.90)</td>
<td align="center" valign="middle">0.626</td>
</tr>
<tr>
<td align="left" valign="middle">ZhangAge acceleration</td>
<td align="center" valign="middle">2.15 (6.47)</td>
<td align="center" valign="middle">&#x2212;1.06 (6.82)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">LinAge acceleration</td>
<td align="center" valign="middle">&#x2212;8.43 (6.66)</td>
<td align="center" valign="middle">&#x2212;7.42 (8.51)</td>
<td align="center" valign="middle">0.134</td>
</tr>
<tr>
<td align="left" valign="middle">WeidnerAge acceleration</td>
<td align="center" valign="middle">&#x2212;10.32 (8.80)</td>
<td align="center" valign="middle">&#x2212;12.13 (10.1)</td>
<td align="center" valign="middle">0.027</td>
</tr>
<tr>
<td align="left" valign="middle">VidalBraloAge acceleration</td>
<td align="center" valign="middle">&#x2212;4.56 (7.32)</td>
<td align="center" valign="middle">&#x2212;6.08 (8.04)</td>
<td align="center" valign="middle">0.020</td>
</tr>
<tr>
<td align="left" valign="middle">GDF15Mort</td>
<td align="center" valign="middle">928 (154)</td>
<td align="center" valign="middle">1,010 (171)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">B2MMort</td>
<td align="center" valign="middle">1,712,009 (168,743)</td>
<td align="center" valign="middle">1,780,582 (166,397)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">CystatinCMort</td>
<td align="center" valign="middle">606,425 (38,641)</td>
<td align="center" valign="middle">625,317 (41,041)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">TIMP1Mort</td>
<td align="center" valign="middle">35,106 (1,555)</td>
<td align="center" valign="middle">35,939 (1,663)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">ADMMort</td>
<td align="center" valign="middle">347 (27.5)</td>
<td align="center" valign="middle">357 (26.8)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">PAI1Mort</td>
<td align="center" valign="middle">17,262 (2,749)</td>
<td align="center" valign="middle">17,685 (2,632)</td>
<td align="center" valign="middle">0.052</td>
</tr>
<tr>
<td align="left" valign="middle">LeptinMort</td>
<td align="center" valign="middle">9,291 (4,075)</td>
<td align="center" valign="middle">9,198 (3,992)</td>
<td align="center" valign="middle">0.776</td>
</tr>
<tr>
<td align="left" valign="middle">PACKYRSMort</td>
<td align="center" valign="middle">18.0 (13.0)</td>
<td align="center" valign="middle">20.8 (12.6)</td>
<td align="center" valign="middle">0.007</td>
</tr>
<tr>
<td align="left" valign="middle">CRPMort</td>
<td align="center" valign="middle">0.73 (0.45)</td>
<td align="center" valign="middle">0.75 (0.45)</td>
<td align="center" valign="middle">0.508</td>
</tr>
<tr>
<td align="left" valign="middle">logA1CMort</td>
<td align="center" valign="middle">1.73 (0.03)</td>
<td align="center" valign="middle">1.73 (0.03)</td>
<td align="center" valign="middle">0.446</td>
</tr>
<tr>
<td align="left" valign="middle">GrimAgeMort</td>
<td align="center" valign="middle">64.2 (8.64)</td>
<td align="center" valign="middle">69.0 (9.12)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">GrimAge2Mort</td>
<td align="center" valign="middle">70.0 (8.55)</td>
<td align="center" valign="middle">74.4 (9.04)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">HorvathTelo</td>
<td align="center" valign="middle">6.63 (0.30)</td>
<td align="center" valign="middle">6.47 (0.34)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">YangCell</td>
<td align="center" valign="middle">0.06 (0.02)</td>
<td align="center" valign="middle">0.07 (0.02)</td>
<td align="center" valign="middle">0.312</td>
</tr>
<tr>
<td align="left" valign="middle">DunedinPoAm</td>
<td align="center" valign="middle">1.10 (0.09)</td>
<td align="center" valign="middle">1.12 (0.09)</td>
<td align="center" valign="middle">0.020</td>
</tr>
<tr>
<td align="left" valign="middle">CD8TPP</td>
<td align="center" valign="middle">0.09 (0.04)</td>
<td align="center" valign="middle">0.09 (0.04)</td>
<td align="center" valign="middle">0.514</td>
</tr>
<tr>
<td align="left" valign="middle">CD4TPP</td>
<td align="center" valign="middle">0.17 (0.06)</td>
<td align="center" valign="middle">0.15 (0.07)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Nkcell</td>
<td align="center" valign="middle">0.06 (0.03)</td>
<td align="center" valign="middle">0.06 (0.03)</td>
<td align="center" valign="middle">0.158</td>
</tr>
<tr>
<td align="left" valign="middle">Bcell</td>
<td align="center" valign="middle">0.07 (0.03)</td>
<td align="center" valign="middle">0.06 (0.05)</td>
<td align="center" valign="middle">0.220</td>
</tr>
<tr>
<td align="left" valign="middle">MonoPP</td>
<td align="center" valign="middle">0.08 (0.02)</td>
<td align="center" valign="middle">0.08 (0.02)</td>
<td align="center" valign="middle">0.181</td>
</tr>
<tr>
<td align="left" valign="middle">NeuPP</td>
<td align="center" valign="middle">0.57 (0.11)</td>
<td align="center" valign="middle">0.60 (0.12)</td>
<td align="center" valign="middle">0.018</td>
</tr>
<tr>
<td align="left" valign="middle">WTDN4YR</td>
<td align="center" valign="middle">33,481 (31,803)</td>
<td align="center" valign="middle">38,071 (28,596)</td>
<td align="center" valign="middle">0.054</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap position="float" id="tab3">
<label>Table 3</label>
<caption>
<p>Diabetic baseline table.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" rowspan="2">Variable</th>
<th align="center" valign="top">Non-diabetic</th>
<th align="center" valign="top">Diabetic</th>
<th align="center" valign="top" rowspan="2"><italic>p</italic> Overall</th>
</tr>
<tr>
<th align="center" valign="top"><italic>N</italic>&#x202F;=&#x202F;1,810</th>
<th align="center" valign="top"><italic>N</italic>&#x202F;=&#x202F;394</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Age</td>
<td align="center" valign="middle">65.6 (10.1)</td>
<td align="center" valign="middle">66.6 (8.99)</td>
<td align="center" valign="middle">0.048</td>
</tr>
<tr>
<td align="left" valign="middle">Race:</td>
<td/>
<td/>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Mexican</td>
<td align="center" valign="middle">481 (26.6%)</td>
<td align="center" valign="middle">135 (34.3%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Non-Hispanic whites</td>
<td align="center" valign="middle">115 (6.4%)</td>
<td align="center" valign="middle">30 (7.6%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Non-Hispanic blacks</td>
<td align="center" valign="middle">800 (44.2%)</td>
<td align="center" valign="middle">106 (26.9%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Other Hispanics</td>
<td align="center" valign="middle">357 (19.7%)</td>
<td align="center" valign="middle">107 (27.1%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Other Ethnic Groups</td>
<td align="center" valign="middle">57 (3.1%)</td>
<td align="center" valign="middle">16 (4.1%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Edu:</td>
<td/>
<td/>
<td align="center" valign="middle">0.001</td>
</tr>
<tr>
<td align="left" valign="middle">High school and above</td>
<td align="center" valign="middle">1,358 (75.0%)</td>
<td align="center" valign="middle">262 (66.5%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Below high school</td>
<td align="center" valign="middle">452 (25.0%)</td>
<td align="center" valign="middle">132 (33.5%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Marry:</td>
<td/>
<td/>
<td align="center" valign="middle">0.918</td>
</tr>
<tr>
<td align="left" valign="middle">Get married</td>
<td align="center" valign="middle">1,170 (64.6%)</td>
<td align="center" valign="middle">253 (64.2%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Unmarried</td>
<td align="center" valign="middle">640 (35.4%)</td>
<td align="center" valign="middle">141 (35.8%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Hypertension:</td>
<td/>
<td/>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Didn&#x2019;t happened</td>
<td align="center" valign="middle">1,018 (56.2%)</td>
<td align="center" valign="middle">138 (35.0%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Exist</td>
<td align="center" valign="middle">792 (43.8%)</td>
<td align="center" valign="middle">256 (65.0%)</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">HorvathAge</td>
<td align="center" valign="middle">66.5 (9.23)</td>
<td align="center" valign="middle">67.8 (8.43)</td>
<td align="center" valign="middle">0.007</td>
</tr>
<tr>
<td align="left" valign="middle">HannumAge</td>
<td align="center" valign="middle">66.6 (9.75)</td>
<td align="center" valign="middle">68.1 (9.05)</td>
<td align="center" valign="middle">0.003</td>
</tr>
<tr>
<td align="left" valign="middle">SkinBloodAge</td>
<td align="center" valign="middle">64.1 (9.74)</td>
<td align="center" valign="middle">65.4 (8.86)</td>
<td align="center" valign="middle">0.006</td>
</tr>
<tr>
<td align="left" valign="middle">PhenoAge</td>
<td align="center" valign="middle">55.2 (10.8)</td>
<td align="center" valign="middle">56.8 (9.86)</td>
<td align="center" valign="middle">0.004</td>
</tr>
<tr>
<td align="left" valign="middle">ZhangAge</td>
<td align="center" valign="middle">66.6 (3.82)</td>
<td align="center" valign="middle">67.1 (3.45)</td>
<td align="center" valign="middle">0.029</td>
</tr>
<tr>
<td align="left" valign="middle">LinAge</td>
<td align="center" valign="middle">57.0 (12.5)</td>
<td align="center" valign="middle">58.7 (11.2)</td>
<td align="center" valign="middle">0.010</td>
</tr>
<tr>
<td align="left" valign="middle">WeidnerAge</td>
<td align="center" valign="middle">54.2 (10.9)</td>
<td align="center" valign="middle">54.9 (9.46)</td>
<td align="center" valign="middle">0.197</td>
</tr>
<tr>
<td align="left" valign="middle">VidalBraloAge</td>
<td align="center" valign="middle">60.2 (6.89)</td>
<td align="center" valign="middle">60.5 (6.44)</td>
<td align="center" valign="middle">0.326</td>
</tr>
<tr>
<td align="left" valign="middle">HorvathAge acceleration</td>
<td align="center" valign="middle">0.85 (5.56)</td>
<td align="center" valign="middle">1.12 (6.02)</td>
<td align="center" valign="middle">0.416</td>
</tr>
<tr>
<td align="left" valign="middle">HannumAge acceleration</td>
<td align="center" valign="middle">0.97 (5.50)</td>
<td align="center" valign="middle">1.49 (5.29)</td>
<td align="center" valign="middle">0.077</td>
</tr>
<tr>
<td align="left" valign="middle">SkinBloodAge acceleration</td>
<td align="center" valign="middle">&#x2212;1.56 (4.51)</td>
<td align="center" valign="middle">&#x2212;1.20 (4.67)</td>
<td align="center" valign="middle">0.161</td>
</tr>
<tr>
<td align="left" valign="middle">PhenoAge acceleration</td>
<td align="center" valign="middle">&#x2212;10.45 (6.67)</td>
<td align="center" valign="middle">&#x2212;9.85 (6.85)</td>
<td align="center" valign="middle">0.118</td>
</tr>
<tr>
<td align="left" valign="middle">ZhangAge acceleration</td>
<td align="center" valign="middle">1.00 (6.74)</td>
<td align="center" valign="middle">0.41 (6.14)</td>
<td align="center" valign="middle">0.094</td>
</tr>
<tr>
<td align="left" valign="middle">LinAge acceleration</td>
<td align="center" valign="middle">&#x2212;8.58 (7.57)</td>
<td align="center" valign="middle">&#x2212;7.96 (7.07)</td>
<td align="center" valign="middle">0.118</td>
</tr>
<tr>
<td align="left" valign="middle">WeidnerAge acceleration</td>
<td align="center" valign="middle">&#x2212;11.44 (9.56)</td>
<td align="center" valign="middle">&#x2212;11.75 (9.15)</td>
<td align="center" valign="middle">0.544</td>
</tr>
<tr>
<td align="left" valign="middle">VidalBraloAge acceleration</td>
<td align="center" valign="middle">&#x2212;5.45 (7.58)</td>
<td align="center" valign="middle">&#x2212;6.11 (7.47)</td>
<td align="center" valign="middle">0.116</td>
</tr>
<tr>
<td align="left" valign="middle">GDF15Mort</td>
<td align="center" valign="middle">962 (167)</td>
<td align="center" valign="middle">983 (149)</td>
<td align="center" valign="middle">0.014</td>
</tr>
<tr>
<td align="left" valign="middle">B2MMort</td>
<td align="center" valign="middle">1,743,827 (175,105)</td>
<td align="center" valign="middle">1,769,706 (171,428)</td>
<td align="center" valign="middle">0.007</td>
</tr>
<tr>
<td align="left" valign="middle">CystatinCMort</td>
<td align="center" valign="middle">614,217 (40,737)</td>
<td align="center" valign="middle">620,710 (37,297)</td>
<td align="center" valign="middle">0.002</td>
</tr>
<tr>
<td align="left" valign="middle">TIMP1Mort</td>
<td align="center" valign="middle">35,388 (1,613)</td>
<td align="center" valign="middle">35,655 (1,421)</td>
<td align="center" valign="middle">0.001</td>
</tr>
<tr>
<td align="left" valign="middle">ADMMort</td>
<td align="center" valign="middle">350 (27.0)</td>
<td align="center" valign="middle">353 (25.6)</td>
<td align="center" valign="middle">0.018</td>
</tr>
<tr>
<td align="left" valign="middle">PAI1Mort</td>
<td align="center" valign="middle">17,179 (2,752)</td>
<td align="center" valign="middle">18,550 (2,703)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">LeptinMort</td>
<td align="center" valign="middle">9,330 (4,053)</td>
<td align="center" valign="middle">9,958 (4,299)</td>
<td align="center" valign="middle">0.008</td>
</tr>
<tr>
<td align="left" valign="middle">PACKYRSMort</td>
<td align="center" valign="middle">18.8 (13.4)</td>
<td align="center" valign="middle">19.4 (12.1)</td>
<td align="center" valign="middle">0.369</td>
</tr>
<tr>
<td align="left" valign="middle">CRPMort</td>
<td align="center" valign="middle">0.75 (0.46)</td>
<td align="center" valign="middle">0.93 (0.44)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">logA1CMort</td>
<td align="center" valign="middle">1.72 (0.03)</td>
<td align="center" valign="middle">1.75 (0.03)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">GrimAgeMort</td>
<td align="center" valign="middle">65.8 (8.93)</td>
<td align="center" valign="middle">67.3 (7.94)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">GrimAge2Mort</td>
<td align="center" valign="middle">71.5 (8.82)</td>
<td align="center" valign="middle">73.6 (7.79)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">HorvathTelo</td>
<td align="center" valign="middle">6.58 (0.31)</td>
<td align="center" valign="middle">6.56 (0.31)</td>
<td align="center" valign="middle">0.220</td>
</tr>
<tr>
<td align="left" valign="middle">YangCell</td>
<td align="center" valign="middle">0.06 (0.02)</td>
<td align="center" valign="middle">0.07 (0.02)</td>
<td align="center" valign="middle">0.048</td>
</tr>
<tr>
<td align="left" valign="middle">DunedinPoAm</td>
<td align="center" valign="middle">1.11 (0.09)</td>
<td align="center" valign="middle">1.12 (0.09)</td>
<td align="center" valign="middle">0.125</td>
</tr>
<tr>
<td align="left" valign="middle">CD8TPP</td>
<td align="center" valign="middle">0.09 (0.04)</td>
<td align="center" valign="middle">0.10 (0.05)</td>
<td align="center" valign="middle">0.237</td>
</tr>
<tr>
<td align="left" valign="middle">CD4TPP</td>
<td align="center" valign="middle">0.17 (0.06)</td>
<td align="center" valign="middle">0.16 (0.07)</td>
<td align="center" valign="middle">0.503</td>
</tr>
<tr>
<td align="left" valign="middle">Nkcell</td>
<td align="center" valign="middle">0.06 (0.03)</td>
<td align="center" valign="middle">0.06 (0.03)</td>
<td align="center" valign="middle">0.616</td>
</tr>
<tr>
<td align="left" valign="middle">Bcell</td>
<td align="center" valign="middle">0.07 (0.03)</td>
<td align="center" valign="middle">0.07 (0.03)</td>
<td align="center" valign="middle">0.877</td>
</tr>
<tr>
<td align="left" valign="middle">MonoPP</td>
<td align="center" valign="middle">0.08 (0.02)</td>
<td align="center" valign="middle">0.08 (0.02)</td>
<td align="center" valign="middle">0.938</td>
</tr>
<tr>
<td align="left" valign="middle">NeuPP</td>
<td align="center" valign="middle">0.59 (0.11)</td>
<td align="center" valign="middle">0.59 (0.11)</td>
<td align="center" valign="middle">0.718</td>
</tr>
<tr>
<td align="left" valign="middle">WTDN4YR</td>
<td align="center" valign="middle">32,234 (30,634)</td>
<td align="center" valign="middle">21,961 (25,770)</td>
<td align="center" valign="middle">&#x003C;0.001</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec9">
<label>2.3</label>
<title>Machine learning modeling</title>
<p>The study population was randomly divided into training and validation sets at an 80:20 ratio, followed by standardization preprocessing. Nine machine learning algorithms, including AdaBoost, GBM, KNN, LightGBM, MLP, RF, SVM, XGBoost, and Logistic Regression (see <xref ref-type="table" rid="tab4">Table 4</xref> for details), were used to develop predictive models.</p>
<table-wrap position="float" id="tab4">
<label>Table 4</label>
<caption>
<p>Comparison of differences among 9 machine learning models.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Name</th>
<th align="left" valign="top">Features</th>
<th align="left" valign="top">Advantages</th>
<th align="left" valign="top">Disadvantages</th>
<th align="left" valign="top">Applicable Scenarios</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">AdaBoost (Adaptive boosting)</td>
<td align="left" valign="top">Gradually improve model performance by combining multiple weak classifiers (typically decision trees), with a particular emphasis on samples that were previously misclassified.</td>
<td align="left" valign="top">Improve classification accuracy; simple and easy to implement; applicable to binary classification problems.</td>
<td align="left" valign="top">Sensitive to outliers and noise; difficult to handle multi-class problems.</td>
<td align="left" valign="top">Binary classification tasks; scenarios where the performance of simple models needs to be improved.</td>
</tr>
<tr>
<td align="left" valign="top">GBM (Gradient boosting machine)</td>
<td align="left" valign="top">Optimize the loss function by gradually adding decision trees and use gradient descent methods to minimize error.</td>
<td align="left" valign="top">Powerful predictive ability; high flexibility; capable of optimizing various loss functions.</td>
<td align="left" valign="top">Long training time; prone to overfitting; complex parameter tuning.</td>
<td align="left" valign="top">Regression and classification tasks; prediction problems on complex datasets.</td>
</tr>
<tr>
<td align="left" valign="top">KNN (K-nearest neighbors)</td>
<td align="left" valign="top">Based on distance metrics; make predictions by finding the nearest K neighbors; applicable to classification and regression.</td>
<td align="left" valign="top">Simple and intuitive; no training process required; suitable for small datasets.</td>
<td align="left" valign="top">High computational cost; poor performance on high-dimensional data; sensitive to noise.</td>
<td align="left" valign="top">Classification and regression tasks; small-scale datasets; scenarios requiring simple models.</td>
</tr>
<tr>
<td align="left" valign="top">LightGBM (Light gradient boosting machine)</td>
<td align="left" valign="top">An efficient gradient boosting framework developed by Microsoft, utilizing histogram-based decision tree algorithms, supporting categorical features, offering fast training speed, and low memory consumption.</td>
<td align="left" valign="top">Fast training speed; high memory efficiency; supports large-scale data; efficient handling of categorical features.</td>
<td align="left" valign="top">Complex parameter tuning; sensitive to outliers; not suitable for small datasets.</td>
<td align="left" valign="top">Large-scale datasets; tasks requiring fast training and prediction; scenarios with many categorical features.</td>
</tr>
<tr>
<td align="left" valign="top">MLP (Multi-layer perceptron)</td>
<td align="left" valign="top">A multilayer perceptron consists of multiple hidden layers, uses nonlinear activation functions, and is capable of learning complex patterns and relationships.</td>
<td align="left" valign="top">Able to capture complex nonlinear relationships; suitable for various tasks (classification, regression).</td>
<td align="left" valign="top">Long training time; requires large amounts of data; difficult to interpret; prone to overfitting.</td>
<td align="left" valign="top">Large-scale and complex datasets; tasks requiring handling of nonlinear relationships.</td>
</tr>
<tr>
<td align="left" valign="top">RF (Random forest)</td>
<td align="left" valign="top">By constructing multiple decision trees and combining their prediction results, randomly selecting features and samples to generate diverse tree structures.</td>
<td align="left" valign="top">Strong resistance to overfitting; suitable for high-dimensional data; capable of handling missing values; easy to parallelize.</td>
<td align="left" valign="top">Large model size; slow prediction speed; difficult to interpret.</td>
<td align="left" valign="top">Classification and regression tasks; high-dimensional data; scenarios requiring robust models.</td>
</tr>
<tr>
<td align="left" valign="top">SVM (Support vector machine)</td>
<td align="left" valign="top">Finds a hyperplane that maximizes the classification margin; applicable to high-dimensional and small-sample data; handles nonlinear boundaries through kernel functions.</td>
<td align="left" valign="top">Performs well in high-dimensional spaces; suitable for small-sample data; handles nonlinear problems through kernel functions.</td>
<td align="left" valign="top">Long training time; not friendly to large-scale datasets; complex parameter tuning; sensitive to noise.</td>
<td align="left" valign="top">High-dimensional data; small-scale datasets; tasks requiring precise classification boundaries.</td>
</tr>
<tr>
<td align="left" valign="top">XGBoost (Extreme gradient boosting)</td>
<td align="left" valign="top">An optimized gradient boosting framework with efficient implementation and strong performance, incorporating parallel processing, regularization, and pruning techniques.</td>
<td align="left" valign="top">High performance; strong scalability; supports parallel computing; prevents overfitting; widely used in competitions and real-world problems.</td>
<td align="left" valign="top">Parameter tuning is complex; training time is relatively long; and there are high requirements for data preprocessing.</td>
<td align="left" valign="top">Regression and classification tasks of various types; scenarios requiring high prediction accuracy and model performance; large-scale datasets.</td>
</tr>
<tr>
<td align="left" valign="top">Logistic regression</td>
<td align="left" valign="top">Transforms the linearly combined input features into probability values using a logistic function (e.g., the Sigmoid function), suitable for binary and multiclass classification problems.</td>
<td align="left" valign="top">Simple and easy to understand; computationally efficient; strong model interpretability; suitable for linearly separable data.</td>
<td align="left" valign="top">Only applicable to linear relationships; sensitive to multicollinearity; not suitable for handling complex nonlinear relationships.</td>
<td align="left" valign="top">Binary and multiclass classification tasks; scenarios where model interpretability is required; linearly separable datasets.</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Oversampling was performed using SMOTE to balance the positive and negative samples, generating more positive samples to alleviate the class imbalance issue. The dataset was then divided into training and test sets. CV was set to 5, indicating 5-fold cross-validation, which was used to assess the average performance of the model under different parameter combinations. The training dataset was randomly divided into five mutually exclusive subsets (folds), with one subset used as the validation set in each iteration, and the remaining four subsets combined for training. This process allowed for 5 training and validation cycles, resulting in five validation outcomes. Grid search (GridSearchCV) was used in conjunction with cross-validation to exhaustively search the parameter grid and return the optimal parameter combination for the machine learning model, thereby achieving the best performing model. Metrics such as Positive Predictive Value, Negative Predictive Value, Sensitivity, Specificity, Matthews Correlation Coefficient, AUC, Kappa, Brier Score, accuracy, and F1 Score were used to evaluate model performance (<xref ref-type="table" rid="tab5">Tables 5</xref>, <xref ref-type="table" rid="tab6">6</xref>). The Positive Predictive Value (PPV) reflects the accuracy of the model&#x2019;s positive predictions, with higher values indicating fewer false positives. The F1 score ranges from 0 to 1, with higher values indicating a better balance between precision and recall, making it suitable for imbalanced class problems. The above metrics, combined with ROC curves (<xref ref-type="fig" rid="fig1">Figures 1</xref>, <xref ref-type="fig" rid="fig2">2</xref>) and DCA curves (<xref ref-type="fig" rid="fig3">Figures 3</xref>, <xref ref-type="fig" rid="fig4">4</xref>), were used to assess the stability and clinical decision-making ability of the model (<xref ref-type="bibr" rid="ref23">23</xref>).</p>
<table-wrap position="float" id="tab5">
<label>Table 5</label>
<caption>
<p>Diabetes prediction model performance evaluation.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Model</th>
<th align="center" valign="top">PPV</th>
<th align="center" valign="top">NPV</th>
<th align="center" valign="top">Sensitivity</th>
<th align="center" valign="top">Specificity</th>
<th align="center" valign="top">MCC</th>
<th align="center" valign="top">AUC</th>
<th align="center" valign="top">Kappa</th>
<th align="center" valign="top">Brier Score</th>
<th align="center" valign="top">F1</th>
<th align="center" valign="top">Accuracy</th>
<th align="center" valign="top">Precision</th>
<th align="center" valign="top">Recall</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">AdaBoost</td>
<td align="center" valign="top">0.66</td>
<td align="center" valign="top">0.88</td>
<td align="center" valign="top">0.91</td>
<td align="center" valign="top">0.58</td>
<td align="center" valign="top">0.52</td>
<td align="center" valign="top">0.9</td>
<td align="center" valign="top">0.49</td>
<td align="center" valign="top">0.25</td>
<td align="center" valign="top">0.77</td>
<td align="center" valign="top">0.74</td>
<td align="center" valign="top">0.66</td>
<td align="center" valign="top">0.91</td>
</tr>
<tr>
<td align="left" valign="top">GBM</td>
<td align="center" valign="top">0.71</td>
<td align="center" valign="top">0.89</td>
<td align="center" valign="top">0.91</td>
<td align="center" valign="top">0.67</td>
<td align="center" valign="top">0.59</td>
<td align="center" valign="top">0.92</td>
<td align="center" valign="top">0.57</td>
<td align="center" valign="top">0.15</td>
<td align="center" valign="top">0.8</td>
<td align="center" valign="top">0.78</td>
<td align="center" valign="top">0.71</td>
<td align="center" valign="top">0.91</td>
</tr>
<tr>
<td align="left" valign="top">GradientBoosting</td>
<td align="center" valign="top">0.72</td>
<td align="center" valign="top">0.89</td>
<td align="center" valign="top">0.91</td>
<td align="center" valign="top">0.67</td>
<td align="center" valign="top">0.59</td>
<td align="center" valign="top">0.92</td>
<td align="center" valign="top">0.57</td>
<td align="center" valign="top">0.15</td>
<td align="center" valign="top">0.8</td>
<td align="center" valign="top">0.78</td>
<td align="center" valign="top">0.72</td>
<td align="center" valign="top">0.91</td>
</tr>
<tr>
<td align="left" valign="top">KNN</td>
<td align="center" valign="top">0.67</td>
<td align="center" valign="top">0.88</td>
<td align="center" valign="top">0.91</td>
<td align="center" valign="top">0.6</td>
<td align="center" valign="top">0.53</td>
<td align="center" valign="top">0.83</td>
<td align="center" valign="top">0.5</td>
<td align="center" valign="top">0.19</td>
<td align="center" valign="top">0.77</td>
<td align="center" valign="top">0.75</td>
<td align="center" valign="top">0.67</td>
<td align="center" valign="top">0.91</td>
</tr>
<tr>
<td align="left" valign="top">LightGBM</td>
<td align="center" valign="top">0.84</td>
<td align="center" valign="top">0.92</td>
<td align="center" valign="top">0.92</td>
<td align="center" valign="top">0.84</td>
<td align="center" valign="top">0.76</td>
<td align="center" valign="top">0.96</td>
<td align="center" valign="top">0.75</td>
<td align="center" valign="top">0.09</td>
<td align="center" valign="top">0.88</td>
<td align="center" valign="top">0.88</td>
<td align="center" valign="top">0.84</td>
<td align="center" valign="top">0.92</td>
</tr>
<tr>
<td align="left" valign="top">MLP</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">0.52</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">1.0</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">0.5</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">0.48</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">0.52</td>
<td align="center" valign="top">1.0</td>
<td align="center" valign="top">0.0</td>
</tr>
<tr>
<td align="left" valign="top">RF</td>
<td align="center" valign="top">0.86</td>
<td align="center" valign="top">0.86</td>
<td align="center" valign="top">0.85</td>
<td align="center" valign="top">0.87</td>
<td align="center" valign="top">0.72</td>
<td align="center" valign="top">0.94</td>
<td align="center" valign="top">0.72</td>
<td align="center" valign="top">0.11</td>
<td align="center" valign="top">0.85</td>
<td align="center" valign="top">0.86</td>
<td align="center" valign="top">0.86</td>
<td align="center" valign="top">0.85</td>
</tr>
<tr>
<td align="left" valign="top">SVM</td>
<td align="center" valign="top">0.48</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">1.0</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">0.36</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">0.26</td>
<td align="center" valign="top">0.64</td>
<td align="center" valign="top">0.48</td>
<td align="center" valign="top">0.48</td>
<td align="center" valign="top">1.0</td>
</tr>
<tr>
<td align="left" valign="top">XGBoost</td>
<td align="center" valign="top">0.82</td>
<td align="center" valign="top">0.91</td>
<td align="center" valign="top">0.91</td>
<td align="center" valign="top">0.82</td>
<td align="center" valign="top">0.73</td>
<td align="center" valign="top">0.96</td>
<td align="center" valign="top">0.73</td>
<td align="center" valign="top">0.1</td>
<td align="center" valign="top">0.87</td>
<td align="center" valign="top">0.86</td>
<td align="center" valign="top">0.82</td>
<td align="center" valign="top">0.91</td>
</tr>
<tr>
<td align="left" valign="top">LogisticRegression</td>
<td align="center" valign="top">0.48</td>
<td align="center" valign="top">0.76</td>
<td align="center" valign="top">0.98</td>
<td align="center" valign="top">0.05</td>
<td align="center" valign="top">0.09</td>
<td align="center" valign="top">0.67</td>
<td align="center" valign="top">0.03</td>
<td align="center" valign="top">0.34</td>
<td align="center" valign="top">0.65</td>
<td align="center" valign="top">0.49</td>
<td align="center" valign="top">0.48</td>
<td align="center" valign="top">0.98</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap position="float" id="tab6">
<label>Table 6</label>
<caption>
<p>Cancer prediction model performance evaluation.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Model</th>
<th align="center" valign="top">PPV</th>
<th align="center" valign="top">NPV</th>
<th align="center" valign="top">Sensitivity</th>
<th align="center" valign="top">Specificity</th>
<th align="center" valign="top">MCC</th>
<th align="center" valign="top">AUC</th>
<th align="center" valign="top">Kappa</th>
<th align="center" valign="top">Brier Score</th>
<th align="center" valign="top">F1</th>
<th align="center" valign="top">Accuracy</th>
<th align="center" valign="top">Precision</th>
<th align="center" valign="top">Recall</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">AdaBoost</td>
<td align="center" valign="top">0.71</td>
<td align="center" valign="top">0.92</td>
<td align="center" valign="top">0.94</td>
<td align="center" valign="top">0.63</td>
<td align="center" valign="top">0.6</td>
<td align="center" valign="top">0.9</td>
<td align="center" valign="top">0.57</td>
<td align="center" valign="top">0.24</td>
<td align="center" valign="top">0.81</td>
<td align="center" valign="top">0.78</td>
<td align="center" valign="top">0.71</td>
<td align="center" valign="top">0.94</td>
</tr>
<tr>
<td align="left" valign="top">GBM</td>
<td align="center" valign="top">0.81</td>
<td align="center" valign="top">0.95</td>
<td align="center" valign="top">0.96</td>
<td align="center" valign="top">0.78</td>
<td align="center" valign="top">0.75</td>
<td align="center" valign="top">0.96</td>
<td align="center" valign="top">0.74</td>
<td align="center" valign="top">0.1</td>
<td align="center" valign="top">0.88</td>
<td align="center" valign="top">0.87</td>
<td align="center" valign="top">0.81</td>
<td align="center" valign="top">0.96</td>
</tr>
<tr>
<td align="left" valign="top">GradientBoosting</td>
<td align="center" valign="top">0.81</td>
<td align="center" valign="top">0.95</td>
<td align="center" valign="top">0.96</td>
<td align="center" valign="top">0.78</td>
<td align="center" valign="top">0.75</td>
<td align="center" valign="top">0.96</td>
<td align="center" valign="top">0.74</td>
<td align="center" valign="top">0.1</td>
<td align="center" valign="top">0.88</td>
<td align="center" valign="top">0.87</td>
<td align="center" valign="top">0.81</td>
<td align="center" valign="top">0.96</td>
</tr>
<tr>
<td align="left" valign="top">KNN</td>
<td align="center" valign="top">0.71</td>
<td align="center" valign="top">0.86</td>
<td align="center" valign="top">0.9</td>
<td align="center" valign="top">0.65</td>
<td align="center" valign="top">0.56</td>
<td align="center" valign="top">0.86</td>
<td align="center" valign="top">0.54</td>
<td align="center" valign="top">0.17</td>
<td align="center" valign="top">0.79</td>
<td align="center" valign="top">0.77</td>
<td align="center" valign="top">0.71</td>
<td align="center" valign="top">0.9</td>
</tr>
<tr>
<td align="left" valign="top">LightGBM</td>
<td align="center" valign="top">0.87</td>
<td align="center" valign="top">0.96</td>
<td align="center" valign="top">0.96</td>
<td align="center" valign="top">0.86</td>
<td align="center" valign="top">0.83</td>
<td align="center" valign="top">0.98</td>
<td align="center" valign="top">0.82</td>
<td align="center" valign="top">0.07</td>
<td align="center" valign="top">0.91</td>
<td align="center" valign="top">0.91</td>
<td align="center" valign="top">0.87</td>
<td align="center" valign="top">0.96</td>
</tr>
<tr>
<td align="left" valign="top">MLP</td>
<td align="center" valign="top">0.5</td>
<td align="center" valign="top">1.0</td>
<td align="center" valign="top">1.0</td>
<td align="center" valign="top">0.03</td>
<td align="center" valign="top">0.12</td>
<td align="center" valign="top">0.52</td>
<td align="center" valign="top">0.03</td>
<td align="center" valign="top">0.49</td>
<td align="center" valign="top">0.67</td>
<td align="center" valign="top">0.51</td>
<td align="center" valign="top">0.5</td>
<td align="center" valign="top">1.0</td>
</tr>
<tr>
<td align="left" valign="top">RF</td>
<td align="center" valign="top">0.89</td>
<td align="center" valign="top">0.91</td>
<td align="center" valign="top">0.9</td>
<td align="center" valign="top">0.89</td>
<td align="center" valign="top">0.79</td>
<td align="center" valign="top">0.96</td>
<td align="center" valign="top">0.79</td>
<td align="center" valign="top">0.09</td>
<td align="center" valign="top">0.9</td>
<td align="center" valign="top">0.9</td>
<td align="center" valign="top">0.89</td>
<td align="center" valign="top">0.9</td>
</tr>
<tr>
<td align="left" valign="top">SVM</td>
<td align="center" valign="top">0.49</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">1.0</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">0.66</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">0.23</td>
<td align="center" valign="top">0.66</td>
<td align="center" valign="top">0.49</td>
<td align="center" valign="top">0.49</td>
<td align="center" valign="top">1.0</td>
</tr>
<tr>
<td align="left" valign="top">XGBoost</td>
<td align="center" valign="top">0.86</td>
<td align="center" valign="top">0.97</td>
<td align="center" valign="top">0.97</td>
<td align="center" valign="top">0.84</td>
<td align="center" valign="top">0.82</td>
<td align="center" valign="top">0.98</td>
<td align="center" valign="top">0.81</td>
<td align="center" valign="top">0.07</td>
<td align="center" valign="top">0.91</td>
<td align="center" valign="top">0.91</td>
<td align="center" valign="top">0.86</td>
<td align="center" valign="top">0.97</td>
</tr>
<tr>
<td align="left" valign="top">LogisticRegression</td>
<td align="center" valign="top">0.49</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">1.0</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">0.66</td>
<td align="center" valign="top">0.0</td>
<td align="center" valign="top">0.34</td>
<td align="center" valign="top">0.66</td>
<td align="center" valign="top">0.49</td>
<td align="center" valign="top">0.49</td>
<td align="center" valign="top">1.0</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>ROC curve of the diabetes model.</p>
</caption>
<graphic xlink:href="fpubh-13-1509458-g001.tif"/>
</fig>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>ROC curves of the cancer model.</p>
</caption>
<graphic xlink:href="fpubh-13-1509458-g002.tif"/>
</fig>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>DCA curves of the diabetic model.</p>
</caption>
<graphic xlink:href="fpubh-13-1509458-g003.tif"/>
</fig>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>DCA curves of the cancer model.</p>
</caption>
<graphic xlink:href="fpubh-13-1509458-g004.tif"/>
</fig>
<p>The ROC curve (Receiver Operating Characteristic Curve) measures the model&#x2019;s discriminatory ability at various thresholds by plotting the trade-off between the True Positive Rate (TPR) and False Positive Rate (FPR). It is insensitive to the proportion of positive and negative samples and is ideal for evaluating binary classification models comprehensively. The DCA curve is typically used to assess the &#x201C;net benefit&#x201D; of a model in practical clinical applications, taking into account the risk&#x2013;benefit balance at different thresholds. Net benefit is a metric that combines the risks of false positives and false negatives. A high net benefit indicates that the model effectively identifies the disease at that threshold, with a greater contribution compared to the cost of incorrect predictions. The threshold refers to the probability cutoff used by the decision model, which determines whether a sample is classified as positive. A higher threshold reduces false positives but may miss some true positives (i.e., increasing false negatives). We need to select the model that provides higher net benefit across a broader range of thresholds. The best-performing model was selected, and SHAP values were computed and plotted in summary graphs (<xref ref-type="fig" rid="fig5">Figures 5</xref>, <xref ref-type="fig" rid="fig6">6</xref>) to report the contribution of each feature. Partial dependence plots (<xref ref-type="fig" rid="fig7">Figures 7</xref>&#x2013;<xref ref-type="fig" rid="fig9">9</xref>) were used to visualize the impact of changes in aging-related genetic biomarkers on the outcomes.</p>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption>
<p>Summary plot of SHAP values for the diabetes model.</p>
</caption>
<graphic xlink:href="fpubh-13-1509458-g005.tif"/>
</fig>
<fig position="float" id="fig6">
<label>Figure 6</label>
<caption>
<p>Summary plot of SHAP values for the cancer model.</p>
</caption>
<graphic xlink:href="fpubh-13-1509458-g006.tif"/>
</fig>
<fig position="float" id="fig7">
<label>Figure 7</label>
<caption>
<p>Cancer PACKYSMort partial dependence plot.</p>
</caption>
<graphic xlink:href="fpubh-13-1509458-g007.tif"/>
</fig>
<fig position="float" id="fig8">
<label>Figure 8</label>
<caption>
<p>Diabetes ratio of poverty partial dependence plot.</p>
</caption>
<graphic xlink:href="fpubh-13-1509458-g008.tif"/>
</fig>
<fig position="float" id="fig9">
<label>Figure 9</label>
<caption>
<p>Diabetes logA1CMort partial dependence plot.</p>
</caption>
<graphic xlink:href="fpubh-13-1509458-g009.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="results" id="sec10">
<label>3</label>
<title>Results</title>
<sec id="sec11">
<label>3.1</label>
<title>Baseline table</title>
<p><xref ref-type="table" rid="tab3">Table 3</xref> the diabetes model included a total of 2,205 participants, with 394 diabetic patients, the majority of whom were of other Hispanic descent. The average age of diabetic patients was 66.6&#x202F;years (SD 8.99), significantly higher than that of non-diabetic patients, which was 65.6&#x202F;years (SD 10.1), <italic>p</italic>&#x202F;=&#x202F;0.048, indicating that age is an important risk factor for tumor occurrence. There was also a significant difference in racial distribution between the two groups (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.001). The proportion of Mexican Americans (34.3%) and other Hispanics (27.1%) was significantly higher in diabetic patients compared to non-diabetic patients (26.6 and 19.7%, respectively), while the proportion of non-Hispanic Blacks was significantly lower in diabetic patients (26.9%) compared to non-diabetic patients (44.2%), indicating a significant racial difference in tumor incidence. The proportion of diabetic patients with a high school education or higher was significantly lower than that of non-diabetic patients (66.5% vs. 75.0%, <italic>p</italic>&#x202F;=&#x202F;0.001). In addition, the prevalence of hypertension was significantly higher in diabetic patients compared to non-diabetic patients (65.0% vs. 43.8%, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.001). There was no significant difference in marital status distribution between the two groups (<italic>p</italic>&#x202F;=&#x202F;0.918). Age-related indicators: All biological age markers (such as HorvathAge, HannumAge, PhenoAge, etc.) in the diabetic group were significantly higher than those in the non-diabetic group (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.05). Indicators such as HorvathAge acceleration, HannumAge acceleration, SkinBloodAge acceleration, PhenoAge acceleration, ZhangAge acceleration, and LinAge acceleration showed significant differences in diabetic patients (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.05), While some age acceleration indicators, such as WeidnerAge acceleration and VidalBraloAge acceleration, showed no significant differences in diabetic patients (<italic>p</italic>&#x202F;&#x003E;&#x202F;0.05). Indicators such as GDF15Mort, B2MMort, CystatinCMort, TIMP1Mort, ADMMort, PAI1Mort, LeptinMort, CRPMort, logA1CMort, GrimAgeMort, GrimAge2Mort, and YangCell were significantly higher in diabetic patients than in non-diabetic patients (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.05). Indicators such as PACKYRSMort, HorvathTelo, DunedinPoAm, CD8TPP, CD4TPP, Nkcell, Bcell, MonoPP, and NeuPP showed no significant differences between the two groups (<italic>p</italic>&#x202F;&#x003E;&#x202F;0.05).</p>
<p><xref ref-type="table" rid="tab2">Table 2</xref> the cancer model included a total of 1,291 participants, with 177 cancer patients, primarily distributed among non-Hispanic Black individuals. The average age of cancer patients (69.1&#x202F;years, SD 10.00) was significantly higher than that of non-cancer patients (63.8&#x202F;years, SD 9.69), <italic>p</italic>&#x202F;&#x003C;&#x202F;0.001. The proportion of cancer patients with a high school education or higher (86.2%) was significantly higher than that of non-cancer patients (79.1%), <italic>p</italic>&#x202F;=&#x202F;0.039. There was a significant difference in racial distribution between the two groups (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.001). Among non-cancer patients, the proportion of non-Hispanic Black individuals was relatively low (42.4%), while this proportion significantly increased to 68.4% in cancer patients. Additionally, the proportion of Mexican Americans, other Hispanics, and other ethnic groups was significantly lower among cancer patients. There was no significant difference between the two groups in terms of marital status (Marry), prevalence of hypertension (Hypertension), and incidence of diabetes (Diabetes). All age clock indicators (such as HorvathAge, HannumAge, SkinBloodAge, PhenoAge, ZhangAge, LinAge, WeidnerAge, VidalBraloAge, etc.) were significantly higher in cancer patients than in non-cancer patients (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.001). ZhangAge acceleration: Cancer patients had significantly lower values than non-cancer patients (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.001). WeidnerAge acceleration (<italic>p</italic>&#x202F;=&#x202F;0.027) and VidalBraloAge acceleration (<italic>p</italic>&#x202F;=&#x202F;0.020): The acceleration markers in cancer patients were significantly different from those in non-cancer patients. Other age acceleration markers (such as HorvathAge acceleration, HannumAge acceleration, etc.) showed no significant differences (<italic>p</italic>&#x202F;&#x003E;&#x202F;0.05). Indicators such as GDF15Mort, B2MMort, CystatinCMort, TIMP1Mort, ADMMort, PACKYRSMort, GrimAgeMort, GrimAge2Mort, HorvathTelo, DunedinPoAm, CD4TPP, and NeuPP were significantly higher in cancer patients than in non-cancer patients (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.05). Indicators such as LeptinMort, CRPMort, logA1CMort, YangCell, CD8TPP, Nkcell, Bcell, and MonoPP showed no significant differences between the two groups (<italic>p</italic>&#x202F;&#x003E;&#x202F;0.05), suggesting that these markers may not have a direct association with tumor incidence in this study, or their mechanisms of action are complex and require further exploration with larger sample sizes or multivariate analyses.</p>
</sec>
<sec id="sec12">
<label>3.2</label>
<title>Epigenetic age clocks</title>
<p>Correlation analysis shows that the correlation coefficients between eight epigenetic ages and chronological age are all greater than 0.5 (<xref ref-type="table" rid="tab7">Table 7</xref>), indicating that they are all strongly positively correlated with age, thus confirming the reliability of these clocks.</p>
<table-wrap position="float" id="tab7">
<label>Table 7</label>
<caption>
<p>Correlation analysis of chronological age and epigenetic age.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Variable</th>
<th align="center" valign="top">Correlation coefficient</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">HorvathAge</td>
<td align="center" valign="middle">0.847</td>
</tr>
<tr>
<td align="left" valign="middle">HannumAge</td>
<td align="center" valign="middle">0.861</td>
</tr>
<tr>
<td align="left" valign="middle">SkinBloodAge</td>
<td align="center" valign="middle">0.910</td>
</tr>
<tr>
<td align="left" valign="middle">PhenoAge</td>
<td align="center" valign="middle">0.804</td>
</tr>
<tr>
<td align="left" valign="middle">ZhangAge</td>
<td align="center" valign="middle">0.930</td>
</tr>
<tr>
<td align="left" valign="middle">LinAge</td>
<td align="center" valign="middle">0.811</td>
</tr>
<tr>
<td align="left" valign="middle">WeidnerAge</td>
<td align="center" valign="middle">0.571</td>
</tr>
<tr>
<td align="left" valign="middle">VidalBraloAge</td>
<td align="center" valign="middle">0.662</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Further heatmap analysis was performed to examine the correlation between epigenetic age acceleration (epigenetic age &#x2013; chronological age) and diabetes, as well as cancer (<xref ref-type="fig" rid="fig10">Figures 10</xref>, <xref ref-type="fig" rid="fig11">11</xref>). These two heatmaps display the partial correlation coefficients between diseases (diabetes and cancer) and epigenetic age clock acceleration, illustrating the independent correlations between each disease and different age acceleration factors. Partial correlation refers to the correlation coefficient for each number, representing the partial correlation between a specific disease (diabetes or cancer) and a particular age acceleration factor. Positive correlation (red): A positive coefficient indicates that the disease is positively correlated with the acceleration factor (the higher the acceleration factor, the higher the disease risk). Negative correlation (blue): A negative coefficient indicates that the disease is negatively correlated with the acceleration factor (the higher the acceleration factor, the lower the disease risk). Close to 0 (gray): No significant correlation. In the heatmap, the colors range from red (positive correlation) to blue (negative correlation), with gray indicating weak correlations.</p>
<fig position="float" id="fig10">
<label>Figure 10</label>
<caption>
<p>Epigenetic age acceleration correlation heatmaps.</p>
</caption>
<graphic xlink:href="fpubh-13-1509458-g010.tif"/>
</fig>
<fig position="float" id="fig11">
<label>Figure 11</label>
<caption>
<p>Epigenetic age acceleration correlation heatmaps.</p>
</caption>
<graphic xlink:href="fpubh-13-1509458-g011.tif"/>
</fig>
<p>The partial correlation coefficients are generally close to 0, indicating that there is almost no significant independent correlation between diabetes and these epigenetic age clock accelerations. The differences in the effects of each acceleration factor on diabetes are minimal and not statistically significant.</p>
<p><xref ref-type="fig" rid="fig10">Figure 10</xref> LinAge acceleration and ZhangAge acceleration show a weak negative correlation with cancer (&#x2212;0.19), suggesting that these two acceleration factors may be associated with a reduced risk of cancer. VidalBraloAge acceleration and HannumAge acceleration show a weak positive correlation with cancer (0.10 and 0.05, respectively), indicating that these epigenetic age clock accelerations may be associated with an increased risk of cancer. Other acceleration factors (such as HorvathAge, SkinBloodAge, etc.) show a correlation close to 0 with cancer.</p>
</sec>
<sec id="sec13">
<label>3.3</label>
<title>Development and performance of risk models</title>
<p>After calculating evaluation metrics and plotting the ROC and DCA curves, this study assesses model performance using multiple indicators, with detailed evaluation values provided in <xref ref-type="table" rid="tab5">Tables 5</xref>, <xref ref-type="table" rid="tab6">6</xref>, which present the performance evaluation of the diabetes and cancer prediction models. This study plots the ROC curves for various models of diabetes and cancer. According to the definition of the ROC curve, as the threshold changes, the curve should ideally be as &#x201C;convex&#x201D; as possible toward the top-left corner. Regions with high TPR and low FPR indicate better classifier performance, so LightGBM is chosen as the model with the best performance. Models with higher DCA curves indicate greater net benefit at the corresponding threshold probabilities, thus demonstrating superior performance. Different models may perform differently across different threshold ranges. For example, in the low threshold range (&#x003C;0.2), some models (such as Logistic Regression and LightGBM) may have higher net benefits. In the middle range (0.2&#x2013;0.6), models like Gradient Boosting and RF may outperform others. At high thresholds (&#x003E;0.7), the net benefit of the models may approach that of the &#x201C;Treat None&#x201D; strategy (no intervention). The reference significance of &#x201C;Treat All&#x201D; and &#x201C;Treat None&#x201D;: &#x201C;Treat All&#x201D; is an extreme strategy where all patients are treated. &#x201C;Treat None&#x201D; is another extreme strategy where no patient receives intervention. When the model&#x2019;s curve lies between &#x201C;Treat All&#x201D; and &#x201C;Treat None,&#x201D; it indicates that the model&#x2019;s prediction lacks clinical value. Selection of the optimal model: Considering the overall threshold range, the model that consistently stays above &#x201C;Treat All&#x201D; and &#x201C;Treat None&#x201D; while covering a broader threshold probability range is the optimal choice. From this DCA curve, it is observed that Gradient Boosting and LightGBM demonstrate superior net benefits across larger threshold ranges. This study evaluates model performance using various indicators, with detailed evaluation values provided in <xref ref-type="table" rid="tab5">Tables 5</xref>, <xref ref-type="table" rid="tab6">6</xref>, which present the performance evaluation of the diabetes and cancer prediction models. In the diabetes prediction, LightGBM achieved an AUC of 1.00, an MCC of 0.97, and an F1 Score of 0.98 on the validation set, while GBM had an AUC of 0.99, an MCC of 0.93, and an F1 Score of 0.95 (<xref ref-type="table" rid="tab5">Table 5</xref>). LightGBM is thus selected as the best model. Similarly, in cancer prediction, LightGBM achieved an AUC of 0.98, an MCC of 0.83, and an F1 Score of 0.91 (<xref ref-type="table" rid="tab6">Table 6</xref>). Therefore, it can be concluded that the LightGBM model is the best comprehensive model for assessing the risk of diabetes and cancer, and is selected for use.</p>
<p>The SHAP value summary plot reports that the top three contributing features in the diabetes model are logA1Mort, family income-to-poverty ratio, and marital status (<xref ref-type="fig" rid="fig5">Figure 5</xref>). In the cancer model, the top three contributing features are gender, non-Hispanic white, and PACKYRSMort (<xref ref-type="fig" rid="fig6">Figure 6</xref>). Based on the above SHAP value summary plot, partial dependence plots for important features were drawn. An increase in logA1Mort is positively correlated with the risk of diabetes (<xref ref-type="fig" rid="fig9">Figure 9</xref>). When the economic status of the subjects is poorer (such as when the family income-to-poverty ratio is close to 0 or 1), the probability of developing diabetes is higher. When the family income-to-poverty ratio is between 1 and 4, the partial dependence values stabilize, and there is no significant fluctuation in diabetes risk. When the poverty ratio exceeds 4, the partial dependence values sharply decrease, suggesting that a higher poverty ratio (better economic status) may be associated with a lower risk of diabetes (<xref ref-type="fig" rid="fig8">Figure 8</xref>). On the other hand, <xref ref-type="fig" rid="fig7">Figure 7</xref> shows that PACKYRSMort is non-linearly related to cancer risk. When the cumulative smoking burden is less than 10, the risk of cancer is relatively low. When the cumulative smoking burden is between 10 and 30, the risk of cancer significantly increases. When the cumulative smoking burden exceeds 30, the risk of cancer shows a declining trend.</p>
</sec>
</sec>
<sec sec-type="discussion" id="sec14">
<label>4</label>
<title>Discussion</title>
<sec id="sec15">
<label>4.1</label>
<title>Epigenetic age clock</title>
<p>Epigenetic clocks rely on DNA methylation (DNAm) analysis at specific CpG sites to predict an individual&#x2019;s chronological age with high accuracy (<xref ref-type="bibr" rid="ref11">11</xref>). Additionally, epigenetic age acceleration&#x2014;the discrepancy between chronological age and epigenetic age&#x2014;is increasingly recognized as a marker of aging, capable of predicting premature onset of diseases and early mortality (<xref ref-type="bibr" rid="ref12">12</xref>). When applied to large-scale human epidemiological datasets, research has shown that the gap between predicted epigenetic age and actual chronological age is linked to various age-related diseases, particularly when epigenetic age surpasses chronological age. There is growing evidence supporting the notion that accelerated epigenetic aging serves as a novel biomarker for cancer risk. A study by Plonski et al. (<xref ref-type="bibr" rid="ref13">13</xref>) found that epigenetic age acceleration correlates with late-stage mortality in both cancer and chronic diseases. Similarly, research by Zheng et al. (<xref ref-type="bibr" rid="ref24">24</xref>) demonstrated a statistically significant positive correlation between epigenetic age acceleration and overall mortality, highlighting its role as a key predictor of colorectal cancer survival. Levine et al. (<xref ref-type="bibr" rid="ref25">25</xref>) further suggested that accelerated epigenetic aging could serve as a useful biomarker for assessing lung cancer susceptibility. In the present study, univariate analysis revealed that all epigenetic clocks (including HorvathAge, HannumAge, PhenoAge, and others) were significantly elevated in cancer patients compared to non-cancer controls. Heatmap analysis also identified a weak negative correlation (&#x2212;0.19) between LinAge acceleration and ZhangAge acceleration with cancer risk, suggesting that these two forms of epigenetic age acceleration might be associated with a lower cancer risk. Conversely, VidalBraloAge acceleration and HannumAge acceleration showed weak positive correlations (0.10 and 0.05, respectively) with cancer, indicating that these epigenetic age accelerations may be linked to an increased cancer risk. These findings support the conclusion that epigenetic age acceleration is potentially associated with cancer risk. Consistent with previous studies (<xref ref-type="bibr" rid="ref14">14</xref>), which have suggested that epigenetic age accelerations, such as Horvath acceleration, Hannum acceleration, and Grim acceleration, can predict cancer mortality, the results reinforce the role of epigenetic age acceleration in cancer outcomes.</p>
<p>In this study, various epigenetic age acceleration markers, including HorvathAge accelerations, HannumAge accelerations, SkinBloodAge accelerations, PhenoAge accelerations, ZhangAge accelerations, and LinAge accelerations, exhibited significant differences in diabetic patients (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.05). However, there was little to no significant independent correlation between diabetes and these accelerations of epigenetic age clocks. Previous research (<xref ref-type="bibr" rid="ref8">8</xref>) has also shown that epigenetic age is linked to the mortality risk in individuals with type 2 diabetes. Vetter et al. (<xref ref-type="bibr" rid="ref26">26</xref>) noted that after adjusting for covariates, no significant cross-sectional association was found between epigenetic age acceleration and the diagnosis of diabetes. On the other hand, longitudinal analysis indicated that in male diabetic participants, each additional year of 7-CpG DNAm acceleration at baseline was associated with an 11% increased likelihood of developing new diabetes-related complications or exacerbating pre-existing complications during the follow-up period. A separate longitudinal study conducted among twins (<xref ref-type="bibr" rid="ref27">27</xref>) found a positive correlation between blood glucose levels and epigenetic age markers. As this study is cross-sectional, it did not perform longitudinal comparisons, suggesting that future research should explore the relationship between epigenetic age and diabetes in more depth through longitudinal studies. Furthermore, due to sample limitations in the database, diabetes was not categorized in this study, highlighting the need for more detailed research with categorized data and larger sample sizes in future investigations.</p>
</sec>
<sec id="sec16">
<label>4.2</label>
<title>The relationship between other epigenetic materials and diseases</title>
<p>In this study, epigenetic markers such as GDF15Mort, B2MMort, CystatinCMort, TIMP1Mort, ADMMort, PACKYRSMort, GrimAgeMort, GrimAge2Mort, HorvathTelo, DunedinPoAm, CD4TPP, and NeuPP were significantly higher in cancer patients compared to non-cancer patients (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.05). These biomarkers are involved in key cellular processes, such as cell cycle regulation, inflammatory response, apoptosis, and gene expression regulation, all of which play crucial roles in cancer development and progression. GDF15 promotes tumor cell invasion and metastasis by regulating cell migration and apoptosis (<xref ref-type="bibr" rid="ref28">28</xref>). High expression of GDF15 in various cancer types is associated with tumor invasiveness and poor prognosis (<xref ref-type="bibr" rid="ref29">29</xref>). TIMP1 as a matrix metalloproteinase inhibitor, TIMP1 regulates matrix remodeling in the tumor microenvironment and promotes tumor metastasis (<xref ref-type="bibr" rid="ref30">30</xref>, <xref ref-type="bibr" rid="ref31">31</xref>). Elevated levels of TIMP1 are linked to poor prognosis in multiple cancers (<xref ref-type="bibr" rid="ref32 ref33 ref34">32&#x2013;34</xref>).</p>
</sec>
<sec id="sec17">
<label>4.3</label>
<title>Diabetes risk assessment model</title>
<p>This study employed machine learning techniques to analyze the relationship between 30 epigenetic biomarkers and the risks of diabetes and cancer, and it visualized the association between the most influential biomarkers and the outcomes. In the diabetes risk assessment model, the top three most important features identified were logA1Mort, the household income to poverty ratio, and marital status. Among these, logA1Mort demonstrated a linear relationship with the onset of diabetes, where its increase was positively correlated with an elevated risk of diabetes. LogA1Mort refers to the log-transformed glycated hemoglobin value derived from DNA methylation (<xref ref-type="bibr" rid="ref35">35</xref>), and evidence indicates that it is strongly correlated with insulin, triglyceride, and glucose levels, as well as with insulin sensitivity and glucose metabolism (<xref ref-type="bibr" rid="ref35">35</xref>). Importantly, studies have shown that for each standard deviation increase in logA1Mort, the risk ratio for coronary heart disease rises by approximately 30% (<xref ref-type="bibr" rid="ref35">35</xref>). These findings suggest that logA1Mort could serve as a valuable biomarker for predicting diabetes, particularly in the context of an aging population. Integrating age with epigenetic biomarkers could facilitate the identification of high-risk groups, enabling earlier interventions. This study is the first to quantify the contribution of logA1Mort in diabetes prediction using machine learning techniques. By incorporating machine learning models alongside 30 epigenetic biomarkers, we were able to more accurately assess the contribution of these biomarkers to diabetes risk, offering a novel approach for early diabetes screening.</p>
<p>In this study, a poorer economic status, as indicated by a household income-to-poverty ratio close to 0 or 1, was associated with a higher likelihood of developing diabetes. When the household income-to-poverty ratio ranged from 1 to 4, the partial dependence values stabilized, showing no significant fluctuations in diabetes risk. However, when the poverty ratio exceeded 4, the partial dependence values sharply decreased, suggesting that a higher poverty ratio (which reflects better economic status) may be linked to a reduced risk of developing diabetes. The household income-to-poverty ratio, as a proxy for socioeconomic status, has been demonstrated in several studies to significantly influence both the incidence and prognosis of diabetes (<xref ref-type="bibr" rid="ref36">36</xref>). This study further highlights the predictive role of income and poverty ratio in assessing diabetes risk, particularly in low-income groups, where both the incidence and mortality rates of diabetes are higher. Socioeconomic factors can elevate the risk of diabetes by influencing behaviors related to health, access to healthcare, and other factors. Therefore, future diabetes prevention and intervention strategies should take these socioeconomic variables into account, with a particular focus on enhancing early screening and health education for low-income populations.</p>
<p>In this study, marital status is also one of the important features in the diabetes model. Studies have pointed out (<xref ref-type="bibr" rid="ref37">37</xref>) that for minority men and non-Hispanic white men, divorce/separation status is significantly associated with diabetes mortality, while for minority women and non-Hispanic white women, widowhood status is significantly associated with diabetes mortality. Some studies have shown (<xref ref-type="bibr" rid="ref38">38</xref>, <xref ref-type="bibr" rid="ref39">39</xref>) that the impact of marital status on diabetes mortality differs by gender.</p>
</sec>
<sec id="sec18">
<label>4.4</label>
<title>Cancer risk assessment model</title>
<p>In the cancer risk assessment model, gender, non-Hispanic White ethnicity, and PACKYRSMort were identified as the top three important features. Among these, gender was found to be one of the most significant contributing factors, which aligns with existing literature, underscoring gender as a critical element in cancer risk prediction. The incidence of various cancers shows notable differences between males and females. Several studies have indicated (<xref ref-type="bibr" rid="ref40">40</xref>) that men generally exhibit a higher incidence of various cancer types compared to women, particularly cancers that are strongly linked to smoking and alcohol consumption, such as lung cancer, esophageal cancer, and metastatic cancers. Due to differences in endocrine functions, immune system responses, and other factors such as physical activity, men tend to have higher susceptibility to these cancers. For instance, in the case of lung cancer (<xref ref-type="bibr" rid="ref41">41</xref>), men face a significantly higher risk compared to women, especially among smokers. Although smoking rates have decreased among women, the incidence of lung cancer in women has risen in recent years, which may be attributed to factors such as women&#x2019;s smoking levels, genetic predispositions, and gender-specific differences in smoking behaviors. Conversely, breast cancer incidence is substantially higher in women than in men (<xref ref-type="bibr" rid="ref42">42</xref>, <xref ref-type="bibr" rid="ref43">43</xref>), a difference closely tied to the role of estrogen in the female body. Estrogen promotes the development and lactation of breast tissue, and prolonged exposure to this hormone may increase the risk of developing breast cancer.</p>
<p>There is substantial evidence that habitual smoking is a major risk factor for immune-mediated inflammatory diseases and various cancers (<xref ref-type="bibr" rid="ref44">44</xref>). Specifically, smoking is a major risk factor for head and neck cancers and lung cancer (<xref ref-type="bibr" rid="ref45">45</xref>). Approximately 90% of lung cancer cases are directly related to smoking (<xref ref-type="bibr" rid="ref46">46</xref>). Smoking is also closely linked to bladder cancer, pancreatic cancer, and renal pelvic cancer. Smoking is also associated with the etiology of colon cancer, liver cancer, and stomach cancer (<xref ref-type="bibr" rid="ref45">45</xref>, <xref ref-type="bibr" rid="ref46">46</xref>). Existing data clearly indicate that smoking increases the risk of cancer in multiple organs (<xref ref-type="bibr" rid="ref47">47</xref>) and often leads to premature death. The five-year survival rate for lung cancer is very low, only 15%. Other smoking-related cancers, such as liver cancer and pancreatic cancer, also have low five-year survival rates (18 and 9%, respectively). PACKYRSMort is a composite biomarker for estimating pack-years of smoking, proposed by Ake T. Lu based on DNA methylation (<xref ref-type="bibr" rid="ref17">17</xref>). Our study shows that PACKYRSMort has a nonlinear relationship with cancer risk. When the cumulative smoking burden is &#x003C;10, the risk of cancer is relatively low. When the cumulative smoking burden is between 10 and 30, the risk of cancer significantly increases. When the cumulative smoking burden is &#x003E;30, the risk of cancer begins to decline. Our results differ from other studies. Rota et al. (<xref ref-type="bibr" rid="ref48">48</xref>) quantified the dose&#x2013;response relationship between smoking and gastric cancer risk and found that smoking is not only an independent risk factor for gastric cancer, but the risk increases with the number of cigarettes smoked daily, from a small amount to 20, and the risk increases in a dose-dependent manner with the duration of smoking. A meta-analysis by Lugo et al. showed that the risk of gallbladder cancer increases linearly with smoking intensity and duration (<xref ref-type="bibr" rid="ref49">49</xref>). In addition, the risk of breast cancer (<xref ref-type="bibr" rid="ref50">50</xref>) and cervical cancer (<xref ref-type="bibr" rid="ref51">51</xref>) has also been reported to be linearly associated with smoking intensity. Our study is consistent with previous research when the cumulative smoking burden is &#x2264;30, but when the cumulative smoking burden is &#x003E;30, cancer risk shows a certain degree of decline. This phenomenon requires further biological explanation. A possible explanation is that the carcinogenic risk brought by long-term smoking has pushed the individual&#x2019;s health status to the limit, and other health factors (such as immune decline, organ failure, etc.) may begin to significantly affect their cancer risk. Additionally, long-term smoking may alter DNA methylation patterns (<xref ref-type="bibr" rid="ref52">52</xref>, <xref ref-type="bibr" rid="ref53">53</xref>), leading to the suppression or activation of certain gene expressions, thus affecting the mechanisms of cancer development.</p>
<p>In the cancer prediction model, the non-Hispanic White population emerged as a key sociodemographic factor, underscoring the significant role of race and cultural background in cancer risk prediction. Previous studies have shown (<xref ref-type="bibr" rid="ref54">54</xref>) that, compared to non-Hispanic White individuals, Hispanic men and women experienced 25&#x2013;30% lower cancer incidence (2014&#x2013;2018) and mortality rates (2015&#x2013;2019), with a notably lower incidence of common cancers. This study further substantiates the relevance of this group in the cancer model, highlighting the potential influence of racial differences on cancer susceptibility. These findings not only enhance our understanding of cancer risk prediction but also lay the groundwork for future personalized risk assessments. By integrating epigenetic biomarkers (such as PACKYRSMort) with sociodemographic factors (such as gender and non-Hispanic White ethnicity), we can more accurately identify high-risk populations, particularly in contexts where gender, race, and socioeconomic factors intersect. These results offer both theoretical support for personalized cancer prevention strategies and data-driven insights that can inform public health policy development.</p>
</sec>
</sec>
<sec id="sec19">
<label>5</label>
<title>Limitations and future directions</title>
<p>Although this study has made significant progress in exploring the relationship between epigenetic biomarkers and the risk of diabetes and cancer, and has successfully developed relevant predictive models, several limitations remain. These limitations highlight important areas for improvement and provide a clear direction for future research.</p>
<p>Firstly, although this study is based on a large amount of epigenetic data, the data is sourced from a single NHANES database. The types of diabetes and cancer are not further categorized, and the data is geographically limited to North America. Additionally, there are missing data points within the dataset, leading to sample imbalances. While standardization and other balancing techniques were applied during data processing, some bias remains inevitable. Therefore, future validation with external cohorts and additional cohort studies would be helpful for further analysis. Expanding data collection and analysis to include diverse regions, races, and cultural backgrounds would improve the model&#x2019;s applicability and external validity.</p>
<p>Secondly, this study mainly relies on existing epigenetic clocks and machine learning techniques for risk prediction. While these methods have demonstrated their effectiveness in certain aspects, there is still significant potential for improvement in terms of algorithm complexity and predictive accuracy. For instance, training machine learning models requires large volumes of high-quality data, and challenges such as reducing data bias, addressing data loss, and improving feature selection accuracy remain critical areas for improvement. Additionally, the interpretability of these models is another key concern, particularly in the medical field, where it is essential to understand and explain the model&#x2019;s predictions for clinical applications. Therefore, future research should place greater emphasis on enhancing the interpretability of these models, with a particular focus on integrating biological contexts to clarify the roles of various epigenetic biomarkers in disease prediction.</p>
<p>Thirdly, while epigenetic biomarkers offer promising new biological indicators for early regulation and risk assessment of diabetes and cancer, the genetic mechanisms involved are highly complex and operate across multiple regulatory levels. Single markers, such as specific DNA methylation sites or epigenetic age clocks, may not fully capture the underlying biological processes. To address this limitation, future research should incorporate multidimensional analyses that combine epigenetic biomarkers with other molecular markers, such as genetic mutations, proteomics, and transcriptomics. This multi-omics approach would provide a more comprehensive understanding of an individual&#x2019;s aging process and enhance the accuracy of disease risk predictions.</p>
<p>Additionally, as a cross-sectional study, this research is limited in its ability to establish causal relationships and may be influenced by age-related effects or selection bias. To overcome these limitations, future research should consider conducting longitudinal studies to track changes in epigenetic biomarkers over time. This approach would help clarify causal relationships between epigenetic changes and disease development, providing a more dynamic understanding of how these biomarkers contribute to the progression of diseases such as diabetes and cancer.</p>
</sec>
<sec sec-type="conclusions" id="sec20">
<label>6</label>
<title>Conclusion</title>
<p>This study is the first to combine epigenetic age acceleration with risk assessment of diabetes and cancer, and conducted a comprehensive analysis using machine learning models. The results indicate that epigenetic age acceleration is closely associated with cancer risk, but has a weaker relationship with diabetes. Through machine learning methods, the top three contributing features in the diabetes model are logA1Mort, household income-to-poverty ratio, and marital status, with an increase in logA1Mort being positively correlated with diabetes risk. In the cancer model, the top three contributing features are gender, non-Hispanic White ethnicity, and PACKYRSMort, with PACKYRSMort showing a nonlinear relationship with cancer risk.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec21">
<title>Data availability statement</title>
<p>Publicly available datasets were analyzed in this study. The data can be accessed from the NHANES Database at: <ext-link xlink:href="https://www.cdc.gov/nchs/nhanes/index.htm" ext-link-type="uri">https://www.cdc.gov/nchs/nhanes/index.htm</ext-link>.</p>
</sec>
<sec sec-type="ethics-statement" id="sec95">
<title>Ethics statement</title>
<p>This study was based on publicly available datasets. Ethical review and approval was not required for the study, in accordance with the local legislation and institutional requirements.</p>
</sec>
<sec sec-type="author-contributions" id="sec22">
<title>Author contributions</title>
<p>SZ: Conceptualization, Data curation, Formal analysis, Writing &#x2013; review &#x0026; editing. JJ: Conceptualization, Data curation, Writing &#x2013; original draft. BX: Writing &#x2013; review &#x0026; editing, Software. QZ: Investigation, Methodology, Validation, Writing &#x2013; original draft. HM: Data curation, Visualization, Writing &#x2013; original draft.</p>
</sec>
<sec sec-type="funding-information" id="sec23">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research and/or publication of this article.</p>
</sec>
<ack>
<p>We express our gratitude to the participants and staff of the National Health and Nutrition Examination Survey (NHANES) from 2011 to 2018 for their valuable contributions.</p>
</ack>
<sec sec-type="COI-statement" id="sec24">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec25">
<title>Generative AI statement</title>
<p>The authors declare that no Gen AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="sec26">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><label>1.</label><citation citation-type="journal"><person-group person-group-type="author"><collab id="coll1">GBD 2021 Diabetes Collaborators</collab></person-group>. <article-title>Global, regional, and national burden of diabetes from 1990 to 2021, with projections of prevalence to 2050: a systematic analysis for the global burden of disease study 2021</article-title>. <source>Lancet</source>. (<year>2023</year>) <volume>402</volume>:<fpage>203</fpage>&#x2013;<lpage>34</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0140-6736(23)01301-6</pub-id>, PMID: <pub-id pub-id-type="pmid">37356446</pub-id></citation></ref>
<ref id="ref2"><label>2.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bray</surname> <given-names>F</given-names></name> <name><surname>Laversanne</surname> <given-names>M</given-names></name> <name><surname>Sung</surname> <given-names>H</given-names></name> <name><surname>Ferlay</surname> <given-names>J</given-names></name> <name><surname>Siegel</surname> <given-names>RL</given-names></name> <name><surname>Soerjomataram</surname> <given-names>I</given-names></name> <etal/></person-group>. <article-title>Global cancer statistics 2022: Globocan estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title>. <source>CA Cancer J Clin</source>. (<year>2024</year>) <volume>74</volume>:<fpage>229</fpage>&#x2013;<lpage>63</lpage>. doi: <pub-id pub-id-type="doi">10.3322/caac.21834</pub-id>, PMID: <pub-id pub-id-type="pmid">38572751</pub-id></citation></ref>
<ref id="ref3"><label>3.</label><citation citation-type="journal"><person-group person-group-type="author"><collab id="coll2">GBD 2021 Diseases and Injuries Collaborators</collab></person-group>. <article-title>Global incidence, prevalence, years lived with disability (Ylds), disability-adjusted life-years (Dalys), and healthy life expectancy (Hale) for 371 diseases and injuries in 204 countries and territories and 811 subnational locations, 1990-2021: a systematic analysis for the global burden of disease study 2021</article-title>. <source>Lancet</source>. (<year>2024</year>) <volume>403</volume>:<fpage>2133</fpage>&#x2013;<lpage>61</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0140-6736(24)00757-8</pub-id>, PMID: <pub-id pub-id-type="pmid">38642570</pub-id></citation></ref>
<ref id="ref4"><label>4.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>Q</given-names></name> <name><surname>Han</surname> <given-names>L</given-names></name> <name><surname>Liu</surname> <given-names>Y</given-names></name> <name><surname>Wang</surname> <given-names>C</given-names></name> <name><surname>Duan</surname> <given-names>D</given-names></name> <name><surname>Lu</surname> <given-names>N</given-names></name> <etal/></person-group>. <article-title>Elevation of Ptpn 1 promoter methylation is a significant risk factor of type 2 diabetes in the Chinese population</article-title>. <source>Exp Ther Med</source>. (<year>2017</year>) <volume>14</volume>:<fpage>2976</fpage>&#x2013;<lpage>82</lpage>. doi: <pub-id pub-id-type="doi">10.3892/etm.2017.4924</pub-id>, PMID: <pub-id pub-id-type="pmid">29042909</pub-id></citation></ref>
<ref id="ref5"><label>5.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sheaffer</surname> <given-names>KL</given-names></name> <name><surname>Elliott</surname> <given-names>EN</given-names></name> <name><surname>Kaestner</surname> <given-names>KH</given-names></name></person-group>. <article-title>Dna Hypomethylation contributes to genomic instability and intestinal Cancer initiation</article-title>. <source>Cancer Prev Res (Phila)</source>. (<year>2016</year>) <volume>9</volume>:<fpage>534</fpage>&#x2013;<lpage>46</lpage>. doi: <pub-id pub-id-type="doi">10.1158/1940-6207.CAPR-15-0349</pub-id>, PMID: <pub-id pub-id-type="pmid">26883721</pub-id></citation></ref>
<ref id="ref6"><label>6.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sergeev</surname> <given-names>AV</given-names></name> <name><surname>Loiko</surname> <given-names>AG</given-names></name> <name><surname>Genatullina</surname> <given-names>AI</given-names></name> <name><surname>Petrov</surname> <given-names>AS</given-names></name> <name><surname>Kubareva</surname> <given-names>EA</given-names></name> <name><surname>Dolinnaya</surname> <given-names>NG</given-names></name> <etal/></person-group>. <article-title>Crosstalk between G-Quadruplexes and Dnmt3a-mediated methylation of the c-Myc oncogene promoter</article-title>. <source>Int J Mol Sci</source>. (<year>2023</year>) <volume>25</volume>:<fpage>45</fpage>. doi: <pub-id pub-id-type="doi">10.3390/ijms25010045</pub-id>, PMID: <pub-id pub-id-type="pmid">38203216</pub-id></citation></ref>
<ref id="ref7"><label>7.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chu</surname> <given-names>AY</given-names></name> <name><surname>Tin</surname> <given-names>A</given-names></name> <name><surname>Schlosser</surname> <given-names>P</given-names></name> <name><surname>Ko</surname> <given-names>YA</given-names></name> <name><surname>Qiu</surname> <given-names>C</given-names></name> <name><surname>Yao</surname> <given-names>C</given-names></name> <etal/></person-group>. <article-title>Epigenome-wide association studies identify Dna methylation associated with kidney function</article-title>. <source>Nat Commun</source>. (<year>2017</year>) <volume>8</volume>:<fpage>1286</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41467-017-01297-7</pub-id>, PMID: <pub-id pub-id-type="pmid">29097680</pub-id></citation></ref>
<ref id="ref8"><label>8.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sabbatinelli</surname> <given-names>J</given-names></name> <name><surname>Giuliani</surname> <given-names>A</given-names></name> <name><surname>Kwiatkowska</surname> <given-names>KM</given-names></name> <name><surname>Matacchione</surname> <given-names>G</given-names></name> <name><surname>Belloni</surname> <given-names>A</given-names></name> <name><surname>Ramini</surname> <given-names>D</given-names></name> <etal/></person-group>. <article-title>Dna methylation-derived biological age and long-term mortality risk in subjects with type 2 diabetes</article-title>. <source>Cardiovasc Diabetol</source>. (<year>2024</year>) <volume>23</volume>:<fpage>250</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12933-024-02351-7</pub-id>, PMID: <pub-id pub-id-type="pmid">39003492</pub-id></citation></ref>
<ref id="ref9"><label>9.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jones</surname> <given-names>AC</given-names></name> <name><surname>Patki</surname> <given-names>A</given-names></name> <name><surname>Srinivasasainagendra</surname> <given-names>V</given-names></name> <name><surname>Hidalgo</surname> <given-names>BA</given-names></name> <name><surname>Tiwari</surname> <given-names>HK</given-names></name> <name><surname>Limdi</surname> <given-names>NA</given-names></name> <etal/></person-group>. <article-title>A methylation risk score for chronic kidney disease: a hypergen study</article-title>. <source>Sci Rep</source>. (<year>2024</year>) <volume>14</volume>:<fpage>17757</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-024-68470-z</pub-id>, PMID: <pub-id pub-id-type="pmid">39085340</pub-id></citation></ref>
<ref id="ref10"><label>10.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Morales Berstein</surname> <given-names>F</given-names></name> <name><surname>Mccartney</surname> <given-names>DL</given-names></name> <name><surname>Lu</surname> <given-names>AT</given-names></name> <name><surname>Tsilidis</surname> <given-names>KK</given-names></name> <name><surname>Bouras</surname> <given-names>E</given-names></name> <name><surname>Haycock</surname> <given-names>P</given-names></name> <etal/></person-group>. <article-title>Assessing the causal role of epigenetic clocks in the development of multiple cancers: a Mendelian randomization study</article-title>. <source>eLife</source>. (<year>2022</year>) <volume>11</volume>:<fpage>11</fpage>. doi: <pub-id pub-id-type="doi">10.7554/eLife.75374</pub-id>, PMID: <pub-id pub-id-type="pmid">35346416</pub-id></citation></ref>
<ref id="ref11"><label>11.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>HS</given-names></name> <name><surname>Park</surname> <given-names>T</given-names></name></person-group>. <article-title>The influences of DNA methylation and epigenetic clocks, on metabolic disease, in middle-aged Koreans</article-title>. <source>Clin Epigenetics</source>. (<year>2020</year>) <volume>12</volume>:<fpage>148</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13148-020-00936-z</pub-id>, PMID: <pub-id pub-id-type="pmid">33059731</pub-id></citation></ref>
<ref id="ref12"><label>12.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gialluisi</surname> <given-names>A</given-names></name> <name><surname>Santoro</surname> <given-names>A</given-names></name> <name><surname>Tirozzi</surname> <given-names>A</given-names></name> <name><surname>Cerletti</surname> <given-names>C</given-names></name> <name><surname>Donati</surname> <given-names>MB</given-names></name> <name><surname>de Gaetano</surname> <given-names>G</given-names></name> <etal/></person-group>. <article-title>Epidemiological and genetic overlap among biological aging clocks: new challenges in biogerontology</article-title>. <source>Ageing Res Rev</source>. (<year>2021</year>) <volume>72</volume>:<fpage>101502</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.arr.2021.101502</pub-id>, PMID: <pub-id pub-id-type="pmid">34700008</pub-id></citation></ref>
<ref id="ref13"><label>13.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Plonski</surname> <given-names>NM</given-names></name> <name><surname>Chen</surname> <given-names>C</given-names></name> <name><surname>Dong</surname> <given-names>Q</given-names></name> <name><surname>Qin</surname> <given-names>N</given-names></name> <name><surname>Song</surname> <given-names>N</given-names></name> <name><surname>Parikh</surname> <given-names>HM</given-names></name> <etal/></person-group>. <article-title>Epigenetic age in peripheral blood among children, adolescent, and adult survivors of childhood cancer</article-title>. <source>JAMA Netw Open</source>. (<year>2023</year>) <volume>6</volume>:<fpage>e2310325</fpage>. doi: <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.10325</pub-id>, PMID: <pub-id pub-id-type="pmid">37115548</pub-id></citation></ref>
<ref id="ref14"><label>14.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mendy</surname> <given-names>A</given-names></name> <name><surname>Mersha</surname> <given-names>TB</given-names></name></person-group>. <article-title>Epigenetic age acceleration and mortality risk prediction in U.S. adults</article-title>. <source>medRxiv</source>. [Preprint]. (<year>2024</year>) <fpage>2024.08.21.24312373</fpage>. doi: <pub-id pub-id-type="doi">10.1101/2024.08.21.24312373</pub-id></citation></ref>
<ref id="ref15"><label>15.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lin</surname> <given-names>Q</given-names></name> <name><surname>Weidner</surname> <given-names>CI</given-names></name> <name><surname>Costa</surname> <given-names>IG</given-names></name> <name><surname>Marioni</surname> <given-names>RE</given-names></name> <name><surname>Ferreira</surname> <given-names>MRP</given-names></name> <name><surname>Deary</surname> <given-names>IJ</given-names></name> <etal/></person-group>. <article-title>DNA methylation levels at individual age-associated CpG sites can be indicative for life expectancy</article-title>. <source>Aging (Albany NY)</source>. (<year>2016</year>) <volume>8</volume>:<fpage>394</fpage>&#x2013;<lpage>401</lpage>. doi: <pub-id pub-id-type="doi">10.18632/aging.100908</pub-id>, PMID: <pub-id pub-id-type="pmid">26928272</pub-id></citation></ref>
<ref id="ref16"><label>16.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ofori</surname> <given-names>EK</given-names></name> <name><surname>Adekena</surname> <given-names>CN</given-names></name> <name><surname>Boima</surname> <given-names>V</given-names></name> <name><surname>Asare-Anane</surname> <given-names>H</given-names></name> <name><surname>Yorke</surname> <given-names>E</given-names></name> <name><surname>Nyarko</surname> <given-names>ENY</given-names></name> <etal/></person-group>. <article-title>Serum leptin levels in patients with chronic kidney disease and hypertensive heart disease: an observational cross-sectional study</article-title>. <source>Health Sci Rep</source>. (<year>2023</year>) <volume>6</volume>:<fpage>e1053</fpage>. doi: <pub-id pub-id-type="doi">10.1002/hsr2.1053</pub-id>, PMID: <pub-id pub-id-type="pmid">36698704</pub-id></citation></ref>
<ref id="ref17"><label>17.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lu</surname> <given-names>AT</given-names></name> <name><surname>Quach</surname> <given-names>A</given-names></name> <name><surname>Wilson</surname> <given-names>JG</given-names></name> <name><surname>Reiner</surname> <given-names>AP</given-names></name> <name><surname>Aviv</surname> <given-names>A</given-names></name> <name><surname>Raj</surname> <given-names>K</given-names></name> <etal/></person-group>. <article-title>DNA methylation GrimAge strongly predicts lifespan and healthspan</article-title>. <source>Aging (Albany NY)</source>. (<year>2019</year>) <volume>11</volume>:<fpage>303</fpage>&#x2013;<lpage>27</lpage>. doi: <pub-id pub-id-type="doi">10.18632/aging.101684</pub-id>, PMID: <pub-id pub-id-type="pmid">30669119</pub-id></citation></ref>
<ref id="ref18"><label>18.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fujita</surname> <given-names>Y</given-names></name> <name><surname>Taniguchi</surname> <given-names>Y</given-names></name> <name><surname>Shinkai</surname> <given-names>S</given-names></name> <name><surname>Tanaka</surname> <given-names>M</given-names></name> <name><surname>Ito</surname> <given-names>M</given-names></name></person-group>. <article-title>Secreted growth differentiation factor&#x202F;15 as a potential biomarker for mitochondrial dysfunctions in aging and age-related disorders</article-title>. <source>Geriatr Gerontol Int</source>. (<year>2016</year>) <volume>16</volume>:<fpage>17</fpage>&#x2013;<lpage>29</lpage>. doi: <pub-id pub-id-type="doi">10.1111/ggi.12724</pub-id>, PMID: <pub-id pub-id-type="pmid">27018280</pub-id></citation></ref>
<ref id="ref19"><label>19.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Han</surname> <given-names>K</given-names></name> <name><surname>Wang</surname> <given-names>J</given-names></name> <name><surname>Chu</surname> <given-names>Y</given-names></name> <name><surname>Liao</surname> <given-names>Q</given-names></name> <name><surname>Ding</surname> <given-names>Y</given-names></name> <name><surname>Zheng</surname> <given-names>D</given-names></name> <etal/></person-group>. <article-title>Deep learning based method for predicting DNA N6-methyladenosine sites</article-title>. <source>Methods</source>. (<year>2024</year>) <volume>230</volume>:<fpage>91</fpage>&#x2013;<lpage>8</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ymeth.2024.07.012</pub-id>, PMID: <pub-id pub-id-type="pmid">39097179</pub-id></citation></ref>
<ref id="ref20"><label>20.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Baviera-Martineza</surname> <given-names>C</given-names></name> <name><surname>Martinez-Millana</surname> <given-names>A</given-names></name> <name><surname>Lopez-Casanova</surname> <given-names>FB</given-names></name></person-group>. <article-title>Integrating automation, interactive visualization, and unsupervised learning for enhanced diabetes management</article-title>. <source>Stud Health Technol Inform</source>. (<year>2024</year>) <volume>316</volume>:<fpage>1699</fpage>&#x2013;<lpage>703</lpage>. doi: <pub-id pub-id-type="doi">10.3233/SHTI240750</pub-id>, PMID: <pub-id pub-id-type="pmid">39176537</pub-id></citation></ref>
<ref id="ref21"><label>21.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhou</surname> <given-names>D</given-names></name> <name><surname>Tian</surname> <given-names>F</given-names></name> <name><surname>Tian</surname> <given-names>X</given-names></name> <name><surname>Sun</surname> <given-names>L</given-names></name> <name><surname>Huang</surname> <given-names>X</given-names></name> <name><surname>Zhao</surname> <given-names>F</given-names></name> <etal/></person-group>. <article-title>Diagnostic evaluation of a deep learning model for optical diagnosis of colorectal cancer</article-title>. <source>Nat Commun</source>. (<year>2020</year>) <volume>11</volume>:<fpage>2961</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41467-020-16777-6</pub-id>, PMID: <pub-id pub-id-type="pmid">32528084</pub-id></citation></ref>
<ref id="ref22"><label>22.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Anderson</surname> <given-names>JP</given-names></name> <name><surname>Parikh</surname> <given-names>JR</given-names></name> <name><surname>Shenfeld</surname> <given-names>DK</given-names></name> <name><surname>Ivanov</surname> <given-names>V</given-names></name> <name><surname>Marks</surname> <given-names>C</given-names></name> <name><surname>Church</surname> <given-names>BW</given-names></name> <etal/></person-group>. <article-title>Reverse engineering and evaluation of prediction models for progression to type 2 diabetes: an application of machine learning using electronic health records</article-title>. <source>J Diabetes Sci Technol</source>. (<year>2015</year>) <volume>10</volume>:<fpage>6</fpage>&#x2013;<lpage>18</lpage>. doi: <pub-id pub-id-type="doi">10.1177/1932296815620200</pub-id>, PMID: <pub-id pub-id-type="pmid">26685993</pub-id></citation></ref>
<ref id="ref23"><label>23.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guo</surname> <given-names>J</given-names></name> <name><surname>He</surname> <given-names>Q</given-names></name> <name><surname>Li</surname> <given-names>Y</given-names></name></person-group>. <article-title>Machine learning-based prediction of vitamin D deficiency: NHANES 2001-2018</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2024</year>) <volume>15</volume>:<fpage>1327058</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fendo.2024.1327058</pub-id>, PMID: <pub-id pub-id-type="pmid">38449846</pub-id></citation></ref>
<ref id="ref24"><label>24.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zheng</surname> <given-names>C</given-names></name> <name><surname>Li</surname> <given-names>L</given-names></name> <name><surname>Xu</surname> <given-names>R</given-names></name></person-group>. <article-title>Association of epigenetic clock with consensus molecular subtypes and overall survival of colorectal cancer</article-title>. <source>Cancer Epidemiol Biomarkers Prev</source>. (<year>2019</year>) <volume>28</volume>:<fpage>1720</fpage>&#x2013;<lpage>4</lpage>. doi: <pub-id pub-id-type="doi">10.1158/1055-9965.EPI-19-0208</pub-id>, PMID: <pub-id pub-id-type="pmid">31375479</pub-id></citation></ref>
<ref id="ref25"><label>25.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Levine</surname> <given-names>ME</given-names></name> <name><surname>Hosgood</surname> <given-names>HD</given-names></name> <name><surname>Chen</surname> <given-names>B</given-names></name> <name><surname>Absher</surname> <given-names>D</given-names></name> <name><surname>Assimes</surname> <given-names>T</given-names></name> <name><surname>Horvath</surname> <given-names>S</given-names></name></person-group>. <article-title>DNA methylation age of blood predicts future onset of lung cancer in the women's health initiative</article-title>. <source>Aging (Albany NY)</source>. (<year>2015</year>) <volume>7</volume>:<fpage>690</fpage>&#x2013;<lpage>700</lpage>. doi: <pub-id pub-id-type="doi">10.18632/aging.100809</pub-id>, PMID: <pub-id pub-id-type="pmid">26411804</pub-id></citation></ref>
<ref id="ref26"><label>26.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vetter</surname> <given-names>VM</given-names></name> <name><surname>Spieker</surname> <given-names>J</given-names></name> <name><surname>Sommerer</surname> <given-names>Y</given-names></name> <name><surname>Buchmann</surname> <given-names>N</given-names></name> <name><surname>Kalies</surname> <given-names>CH</given-names></name> <name><surname>Regitz-Zagrosek</surname> <given-names>V</given-names></name> <etal/></person-group>. <article-title>DNA methylation age acceleration is associated with risk of diabetes complications</article-title>. <source>Commun Med</source>. (<year>2023</year>) <volume>3</volume>:<fpage>21</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s43856-023-00250-8</pub-id>, PMID: <pub-id pub-id-type="pmid">36765171</pub-id></citation></ref>
<ref id="ref27"><label>27.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Miao</surname> <given-names>K</given-names></name> <name><surname>Hong</surname> <given-names>X</given-names></name> <name><surname>Cao</surname> <given-names>W</given-names></name> <name><surname>Lv</surname> <given-names>J</given-names></name> <name><surname>Yu</surname> <given-names>C</given-names></name> <name><surname>Huang</surname> <given-names>T</given-names></name> <etal/></person-group>. <article-title>Association between epigenetic age and type 2 diabetes mellitus or glycemic traits: a longitudinal twin study</article-title>. <source>Aging Cell</source>. (<year>2024</year>) <volume>23</volume>:<fpage>e14175</fpage>. doi: <pub-id pub-id-type="doi">10.1111/acel.14175</pub-id>, PMID: <pub-id pub-id-type="pmid">38660768</pub-id></citation></ref>
<ref id="ref28"><label>28.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Joo</surname> <given-names>M</given-names></name> <name><surname>Kim</surname> <given-names>D</given-names></name> <name><surname>Lee</surname> <given-names>MW</given-names></name> <name><surname>Lee</surname> <given-names>HJ</given-names></name> <name><surname>Kim</surname> <given-names>JM</given-names></name></person-group>. <article-title>Gdf15 promotes cell growth, migration, and invasion in gastric cancer by inducing Stat3 activation</article-title>. <source>Int J Mol Sci</source>. (<year>2023</year>) <volume>24</volume>:<fpage>2925</fpage>. doi: <pub-id pub-id-type="doi">10.3390/ijms24032925</pub-id>, PMID: <pub-id pub-id-type="pmid">36769245</pub-id></citation></ref>
<ref id="ref29"><label>29.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Siddiqui</surname> <given-names>JA</given-names></name> <name><surname>Pothuraju</surname> <given-names>R</given-names></name> <name><surname>Khan</surname> <given-names>P</given-names></name> <name><surname>Sharma</surname> <given-names>G</given-names></name> <name><surname>Muniyan</surname> <given-names>S</given-names></name> <name><surname>Seshacharyulu</surname> <given-names>P</given-names></name> <etal/></person-group>. <article-title>Pathophysiological role of growth differentiation factor 15 (Gdf15) in obesity, cancer, and cachexia</article-title>. <source>Cytokine Growth Factor Rev</source>. (<year>2022</year>) <volume>64</volume>:<fpage>71</fpage>&#x2013;<lpage>83</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cytogfr.2021.11.002</pub-id>, PMID: <pub-id pub-id-type="pmid">34836750</pub-id></citation></ref>
<ref id="ref30"><label>30.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dantas</surname> <given-names>E</given-names></name> <name><surname>Murthy</surname> <given-names>A</given-names></name> <name><surname>Ahmed</surname> <given-names>T</given-names></name> <name><surname>Ahmed</surname> <given-names>M</given-names></name> <name><surname>Ramsamooj</surname> <given-names>S</given-names></name> <name><surname>Hurd</surname> <given-names>MA</given-names></name> <etal/></person-group>. <article-title>Timp1 is an early biomarker for detection and prognosis of lung cancer</article-title>. <source>Clin Transl Med</source>. (<year>2023</year>) <volume>13</volume>:<fpage>e1391</fpage>. doi: <pub-id pub-id-type="doi">10.1002/ctm2.1391</pub-id>, PMID: <pub-id pub-id-type="pmid">37759102</pub-id></citation></ref>
<ref id="ref31"><label>31.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tian</surname> <given-names>Z</given-names></name> <name><surname>Ou</surname> <given-names>G</given-names></name> <name><surname>Su</surname> <given-names>M</given-names></name> <name><surname>Li</surname> <given-names>R</given-names></name> <name><surname>Pan</surname> <given-names>L</given-names></name> <name><surname>Lin</surname> <given-names>X</given-names></name> <etal/></person-group>. <article-title>Timp1 derived from pancreatic cancer cells stimulates Schwann cells and promotes the occurrence of perineural invasion</article-title>. <source>Cancer Lett</source>. (<year>2022</year>) <volume>546</volume>:<fpage>215863</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.canlet.2022.215863</pub-id>, PMID: <pub-id pub-id-type="pmid">35961511</pub-id></citation></ref>
<ref id="ref32"><label>32.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guccini</surname> <given-names>I</given-names></name> <name><surname>Revandkar</surname> <given-names>A</given-names></name> <name><surname>D'ambrosio</surname> <given-names>M</given-names></name> <name><surname>Colucci</surname> <given-names>M</given-names></name> <name><surname>Pasquini</surname> <given-names>E</given-names></name> <name><surname>Mosole</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>Senescence reprogramming by Timp1 deficiency promotes prostate cancer metastasis</article-title>. <source>Cancer Cell</source>. (<year>2021</year>) <volume>39</volume>:<fpage>68</fpage>&#x2013;<lpage>82.e9</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ccell.2020.10.012</pub-id>, PMID: <pub-id pub-id-type="pmid">33186519</pub-id></citation></ref>
<ref id="ref33"><label>33.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lin</surname> <given-names>X</given-names></name> <name><surname>Zhao</surname> <given-names>R</given-names></name> <name><surname>Bin</surname> <given-names>Y</given-names></name> <name><surname>Huo</surname> <given-names>R</given-names></name> <name><surname>Xue</surname> <given-names>G</given-names></name> <name><surname>Wu</surname> <given-names>J</given-names></name></person-group>. <article-title>Timp1 promotes thyroid cancer cell progression through macrophage phenotypic polarization via the Pi3K/Akt signaling pathway</article-title>. <source>Genomics</source>. (<year>2024</year>) <volume>116</volume>:<fpage>110914</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ygeno.2024.110914</pub-id>, PMID: <pub-id pub-id-type="pmid">39128817</pub-id></citation></ref>
<ref id="ref34"><label>34.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>L</given-names></name> <name><surname>Jiang</surname> <given-names>Q</given-names></name> <name><surname>Li</surname> <given-names>DZ</given-names></name> <name><surname>Zhou</surname> <given-names>X</given-names></name> <name><surname>Yu</surname> <given-names>DS</given-names></name> <name><surname>Zhong</surname> <given-names>J</given-names></name></person-group>. <article-title>Timp1 mRNA in tumor-educated platelets is diagnostic biomarker for colorectal cancer</article-title>. <source>Aging (Albany NY)</source>. (<year>2019</year>) <volume>11</volume>:<fpage>8998</fpage>&#x2013;<lpage>9012</lpage>. doi: <pub-id pub-id-type="doi">10.18632/aging.102366</pub-id>, PMID: <pub-id pub-id-type="pmid">31639773</pub-id></citation></ref>
<ref id="ref35"><label>35.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lu</surname> <given-names>AT</given-names></name> <name><surname>Binder</surname> <given-names>AM</given-names></name> <name><surname>Zhang</surname> <given-names>J</given-names></name> <name><surname>Yan</surname> <given-names>Q</given-names></name> <name><surname>Reiner</surname> <given-names>AP</given-names></name> <name><surname>Cox</surname> <given-names>SR</given-names></name> <etal/></person-group>. <article-title>DNA methylation GrimAge version 2</article-title>. <source>Aging (Albany NY)</source>. (<year>2022</year>) <volume>14</volume>:<fpage>9484</fpage>&#x2013;<lpage>549</lpage>. doi: <pub-id pub-id-type="doi">10.18632/aging.204434</pub-id>, PMID: <pub-id pub-id-type="pmid">36516495</pub-id></citation></ref>
<ref id="ref36"><label>36.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Larkin</surname> <given-names>HD</given-names></name></person-group>. <article-title>AAP recommends immediate, intensive treatment for child obesity</article-title>. <source>JAMA</source>. (<year>2023</year>) <volume>329</volume>:<fpage>364</fpage>. doi: <pub-id pub-id-type="doi">10.1001/jama.2022.24498</pub-id>, PMID: <pub-id pub-id-type="pmid">36652624</pub-id></citation></ref>
<ref id="ref37"><label>37.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kposowa</surname> <given-names>AJ</given-names></name> <name><surname>Aly Ezzat</surname> <given-names>D</given-names></name> <name><surname>Breault</surname> <given-names>K</given-names></name></person-group>. <article-title>Diabetes mellitus and marital status: evidence from the national longitudinal mortality study on the effect of marital dissolution and the death of a spouse</article-title>. <source>Int J Gen Med</source>. (<year>2021</year>) <volume>14</volume>:<fpage>1881</fpage>&#x2013;<lpage>8</lpage>. doi: <pub-id pub-id-type="doi">10.2147/IJGM.S307436</pub-id>, PMID: <pub-id pub-id-type="pmid">34040420</pub-id></citation></ref>
<ref id="ref38"><label>38.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Escolar-Pujolar</surname> <given-names>A</given-names></name> <name><surname>C&#x00F3;rdoba Do&#x00F1;a</surname> <given-names>JA</given-names></name> <name><surname>Goicolea Jul&#x00ED;an</surname> <given-names>I</given-names></name> <name><surname>Rodr&#x00ED;guez</surname> <given-names>GJ</given-names></name> <name><surname>Santos S&#x00E1;nchez</surname> <given-names>V</given-names></name> <name><surname>Mayoral S&#x00E1;nchez</surname> <given-names>E</given-names></name> <etal/></person-group>. <article-title>The effect of marital status on social and gender inequalities in diabetes mortality in Andalusia</article-title>. <source>Endocrinol Diabetes Nutr (Engl Ed)</source>. (<year>2018</year>) <volume>65</volume>:<fpage>21</fpage>&#x2013;<lpage>9</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.endinu.2017.10.006</pub-id>, PMID: <pub-id pub-id-type="pmid">29233513</pub-id></citation></ref>
<ref id="ref39"><label>39.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ramezankhani</surname> <given-names>A</given-names></name> <name><surname>Azizi</surname> <given-names>F</given-names></name> <name><surname>Hadaegh</surname> <given-names>F</given-names></name></person-group>. <article-title>Associations of marital status with diabetes, hypertension, cardiovascular disease and all-cause mortality: a long term follow-up study</article-title>. <source>PLoS One</source>. (<year>2019</year>) <volume>14</volume>:<fpage>e0215593</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0215593</pub-id>, PMID: <pub-id pub-id-type="pmid">31009512</pub-id></citation></ref>
<ref id="ref40"><label>40.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Haupt</surname> <given-names>S</given-names></name> <name><surname>Caramia</surname> <given-names>F</given-names></name> <name><surname>Klein</surname> <given-names>SL</given-names></name> <name><surname>Rubin</surname> <given-names>JB</given-names></name> <name><surname>Haupt</surname> <given-names>Y</given-names></name></person-group>. <article-title>Sex disparities matter in cancer development and therapy</article-title>. <source>Nat Rev Cancer</source>. (<year>2021</year>) <volume>21</volume>:<fpage>393</fpage>&#x2013;<lpage>407</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41568-021-00348-y</pub-id>, PMID: <pub-id pub-id-type="pmid">33879867</pub-id></citation></ref>
<ref id="ref41"><label>41.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Siegfried</surname> <given-names>JM</given-names></name></person-group>. <article-title>Sex and gender differences in lung cancer and chronic obstructive lung disease</article-title>. <source>Endocrinology</source>. (<year>2022</year>) <volume>163</volume>:<fpage>bqab254</fpage>. doi: <pub-id pub-id-type="doi">10.1210/endocr/bqab254</pub-id>, PMID: <pub-id pub-id-type="pmid">34927202</pub-id></citation></ref>
<ref id="ref42"><label>42.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bhardwaj</surname> <given-names>PV</given-names></name> <name><surname>Gupta</surname> <given-names>S</given-names></name> <name><surname>Elyash</surname> <given-names>A</given-names></name> <name><surname>Teplinsky</surname> <given-names>E</given-names></name></person-group>. <article-title>Male breast cancer: a review on diagnosis, treatment, and survivorship</article-title>. <source>Curr Oncol Rep</source>. (<year>2024</year>) <volume>26</volume>:<fpage>34</fpage>&#x2013;<lpage>45</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11912-023-01489-z</pub-id></citation></ref>
<ref id="ref43"><label>43.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Coelingh Bennink</surname> <given-names>HJT</given-names></name> <name><surname>Egberts</surname> <given-names>JFM</given-names></name> <name><surname>Mol</surname> <given-names>JA</given-names></name> <name><surname>Roes</surname> <given-names>KCB</given-names></name> <name><surname>van Diest</surname> <given-names>PJ</given-names></name></person-group>. <article-title>Breast cancer and major deviations of genetic and gender-related structures and function</article-title>. <source>J Clin Endocrinol Metab</source>. (<year>2020</year>) <volume>105</volume>:<fpage>e3065</fpage>&#x2013;<lpage>74</lpage>. doi: <pub-id pub-id-type="doi">10.1210/clinem/dgaa404</pub-id>, PMID: <pub-id pub-id-type="pmid">32594127</pub-id></citation></ref>
<ref id="ref44"><label>44.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Caliri</surname> <given-names>AW</given-names></name> <name><surname>Tommasi</surname> <given-names>S</given-names></name> <name><surname>Besaratinia</surname> <given-names>A</given-names></name></person-group>. <article-title>Relationships among smoking, oxidative stress, inflammation, macromolecular damage, and cancer</article-title>. <source>Mutat Res Rev Mutat Res</source>. (<year>2021</year>) <volume>787</volume>:<fpage>108365</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.mrrev.2021.108365</pub-id>, PMID: <pub-id pub-id-type="pmid">34083039</pub-id></citation></ref>
<ref id="ref45"><label>45.</label><citation citation-type="book"><person-group person-group-type="author"><collab id="coll3">National Center for Chronic Disease Prevention and Health Promotion (US) Office on Smoking and Health</collab></person-group>. <source>The health consequences of smoking&#x2014;50 years of progress: a report of the surgeon general</source>. <publisher-loc>Atlanta (GA)</publisher-loc>: <publisher-name>Centers for Disease Control and Prevention (US)</publisher-name> (<year>2014</year>).</citation></ref>
<ref id="ref46"><label>46.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Viale</surname> <given-names>PH</given-names></name></person-group>. <article-title>The American Cancer Society's facts &#x0026; figures: 2020 edition</article-title>. <source>J Adv Pract Oncol</source>. (<year>2020</year>) <volume>11</volume>:<fpage>135</fpage>&#x2013;<lpage>6</lpage>. doi: <pub-id pub-id-type="doi">10.6004/jadpro.2020.11.2.1</pub-id>, PMID: <pub-id pub-id-type="pmid">33532112</pub-id></citation></ref>
<ref id="ref47"><label>47.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Larsson</surname> <given-names>SC</given-names></name> <name><surname>Burgess</surname> <given-names>S</given-names></name></person-group>. <article-title>Appraising the causal role of smoking in multiple diseases: a systematic review and meta-analysis of Mendelian randomization studies</article-title>. <source>EBioMedicine</source>. (<year>2022</year>) <volume>82</volume>:<fpage>104154</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ebiom.2022.104154</pub-id>, PMID: <pub-id pub-id-type="pmid">35816897</pub-id></citation></ref>
<ref id="ref48"><label>48.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Didovyk</surname> <given-names>A</given-names></name> <name><surname>Tsimring</surname> <given-names>LS</given-names></name></person-group>. <article-title>Synthetic gene circuits learn to classify</article-title>. <source>Cell Syst</source>. (<year>2017</year>) <volume>4</volume>:<fpage>151</fpage>&#x2013;<lpage>3</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cels.2017.02.001</pub-id>, PMID: <pub-id pub-id-type="pmid">28231449</pub-id></citation></ref>
<ref id="ref49"><label>49.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lugo</surname> <given-names>A</given-names></name> <name><surname>Peveri</surname> <given-names>G</given-names></name> <name><surname>Gallus</surname> <given-names>S</given-names></name></person-group>. <article-title>Should we consider gallbladder cancer a new smoking-related cancer? A comprehensive meta-analysis focused on dose-response relationships</article-title>. <source>Int J Cancer</source>. (<year>2020</year>) <volume>146</volume>:<fpage>3304</fpage>&#x2013;<lpage>11</lpage>. doi: <pub-id pub-id-type="doi">10.1002/ijc.32681</pub-id>, PMID: <pub-id pub-id-type="pmid">31513278</pub-id></citation></ref>
<ref id="ref50"><label>50.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Scala</surname> <given-names>M</given-names></name> <name><surname>Bosetti</surname> <given-names>C</given-names></name> <name><surname>Bagnardi</surname> <given-names>V</given-names></name> <name><surname>Possenti</surname> <given-names>I</given-names></name> <name><surname>Specchia</surname> <given-names>C</given-names></name> <name><surname>Gallus</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>Dose-response relationships between cigarette smoking and breast cancer risk: a systematic review and meta-analysis</article-title>. <source>J Epidemiol</source>. (<year>2023</year>) <volume>33</volume>:<fpage>640</fpage>&#x2013;<lpage>8</lpage>. doi: <pub-id pub-id-type="doi">10.2188/jea.JE20220206</pub-id>, PMID: <pub-id pub-id-type="pmid">36967121</pub-id></citation></ref>
<ref id="ref51"><label>51.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Malevolti</surname> <given-names>MC</given-names></name> <name><surname>Lugo</surname> <given-names>A</given-names></name> <name><surname>Scala</surname> <given-names>M</given-names></name> <name><surname>Gallus</surname> <given-names>S</given-names></name> <name><surname>Gorini</surname> <given-names>G</given-names></name> <name><surname>Lachi</surname> <given-names>A</given-names></name> <etal/></person-group>. <article-title>Dose-risk relationships between cigarette smoking and cervical cancer: a systematic review and meta-analysis</article-title>. <source>Eur J Cancer Prev</source>. (<year>2023</year>) <volume>32</volume>:<fpage>171</fpage>&#x2013;<lpage>83</lpage>. doi: <pub-id pub-id-type="doi">10.1097/CEJ.0000000000000773</pub-id>, PMID: <pub-id pub-id-type="pmid">36440802</pub-id></citation></ref>
<ref id="ref52"><label>52.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zeilinger</surname> <given-names>S</given-names></name> <name><surname>K&#x00FC;hnel</surname> <given-names>B</given-names></name> <name><surname>Klopp</surname> <given-names>N</given-names></name> <name><surname>Baurecht</surname> <given-names>H</given-names></name> <name><surname>Kleinschmidt</surname> <given-names>A</given-names></name> <name><surname>Gieger</surname> <given-names>C</given-names></name> <etal/></person-group>. <article-title>Tobacco smoking leads to extensive genome-wide changes in DNA methylation</article-title>. <source>PLoS One</source>. (<year>2013</year>) <volume>8</volume>:<fpage>e63812</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0063812</pub-id>, PMID: <pub-id pub-id-type="pmid">23691101</pub-id></citation></ref>
<ref id="ref53"><label>53.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Su</surname> <given-names>D</given-names></name> <name><surname>Wang</surname> <given-names>X</given-names></name> <name><surname>Campbell</surname> <given-names>MR</given-names></name> <name><surname>Porter</surname> <given-names>DK</given-names></name> <name><surname>Pittman</surname> <given-names>GS</given-names></name> <name><surname>Bennett</surname> <given-names>BD</given-names></name> <etal/></person-group>. <article-title>Distinct epigenetic effects of tobacco smoking in whole blood and among leukocyte subtypes</article-title>. <source>PLoS One</source>. (<year>2016</year>) <volume>11</volume>:<fpage>e0166486</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0166486</pub-id>, PMID: <pub-id pub-id-type="pmid">27935972</pub-id></citation></ref>
<ref id="ref54"><label>54.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Miller</surname> <given-names>KD</given-names></name> <name><surname>Ortiz</surname> <given-names>AP</given-names></name> <name><surname>Pinheiro</surname> <given-names>PS</given-names></name> <name><surname>Bandi</surname> <given-names>P</given-names></name> <name><surname>Minihan</surname> <given-names>A</given-names></name> <name><surname>Fuchs</surname> <given-names>HE</given-names></name> <etal/></person-group>. <article-title>Cancer statistics for the US Hispanic/Latino population, 2021</article-title>. <source>CA Cancer J Clin</source>. (<year>2021</year>) <volume>71</volume>:<fpage>466</fpage>&#x2013;<lpage>87</lpage>. doi: <pub-id pub-id-type="doi">10.3322/caac.21695</pub-id>, PMID: <pub-id pub-id-type="pmid">34545941</pub-id></citation></ref>
</ref-list>
</back>
</article>