<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Endocrinol.</journal-id>
<journal-title>Frontiers in Endocrinology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Endocrinol.</abbrev-journal-title>
<issn pub-type="epub">1664-2392</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fendo.2025.1644396</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Endocrinology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Intelligent prediction of thyroid cancer in China based on GBD data and hospital electronic medical records: disease burden analysis combined with multiple machine learning models</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Yang</surname>
<given-names>Lina</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2898975/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Shixia</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Xinguo</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yang</surname>
<given-names>Jianjun</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3149024/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Chen</surname>
<given-names>Mengya</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Development Department of the Wisdom Hospital, Shandong Provincial Third Hospital</institution>, <addr-line>Jinan</addr-line>,&#xa0;<country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of General Practice, Shandong Provincial Third Hospital</institution>, <addr-line>Jinan</addr-line>,&#xa0;<country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Medical Records, Shandong Provincial Third Hospital</institution>, <addr-line>Jinan</addr-line>,&#xa0;<country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/100397/overview">Sandeep Kumar Mishra</ext-link>, Yale University, United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1837590/overview">Pengzhe Qin</ext-link>, Guangzhou CDC, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3118640/overview">Padma Tatiparti</ext-link>, Gokaraju Rangaraju Institute of Engineering and Technology (GRIET), India</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Mengya Chen, <email xlink:href="mailto:1264377210@qq.com">1264377210@qq.com</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>20</day>
<month>08</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1644396</elocation-id>
<history>
<date date-type="received">
<day>10</day>
<month>06</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>31</day>
<month>07</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Yang, Zhang, Wang, Yang and Chen.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Yang, Zhang, Wang, Yang and Chen</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>This study aims to conduct an in-depth analysis of the disease burden pattern and future trends of thyroid cancer in China, and constructed an intelligent prediction model in combination with hospital electronic medical record data. It comprehensively reveals the disease burden trend of thyroid cancer in China, predicts the mortality rate of thyroid cancer in China, and emphasizes the causal role of high BMI as an important controllable risk factor. And provided a high-precision prediction model for benign and malignant thyroid cancer. The results show that the prevalence of thyroid cancer in China has shown a significant upward trend from 1990 to 2021, especially among women, and the peak age of onset has shifted later. The mortality rate of men is on the rise, while that of women is on the decline. The risk of thyroid cancer mortality caused by high BMI significantly increases during this period, and MR analysis confirms that high BMI increases the risk of thyroid cancer. The ARIMA model predicts that the prevalence of thyroid cancer in China will continue to increase in the next ten years, while the mortality rate will remain relatively stable. Among the machine learning models, XGBoost achieved the highest predictive accuracy and identified BMI as the most influential clinical feature in distinguishing between benign and malignant thyroid tumors. This study provides a solid scientific basis for the development of more accurate and effective strategies for the prevention, early diagnosis, and management of thyroid cancer in China and even globally, and provides a feasible path for the use of artificial intelligence assisted diagnosis in clinical practice.</p>
</abstract>
<kwd-group>
<kwd>thyroid cancer</kwd>
<kwd>disease burden</kwd>
<kwd>body mass index</kwd>
<kwd>EMR</kwd>
<kwd>Mendelian randomization</kwd>
<kwd>machine learning</kwd>
</kwd-group>
<counts>
<fig-count count="4"/>
<table-count count="4"/>
<equation-count count="3"/>
<ref-count count="46"/>
<page-count count="10"/>
<word-count count="5411"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Thyroid Endocrinology</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Thyroid cancer is one of the most common endocrine malignancies and ranks prominently among head and neck cancers worldwide, accounting for about 3% to 4% of all cancer cases (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B2">2</xref>). In the past four decades, the prevalence of thyroid cancer worldwide has shown a significant upward trend in many countries (<xref ref-type="bibr" rid="B3">3</xref>).</p>
<p>The thyroid gland is a butterfly-shaped gland located in the front of the neck. Its main function is to secrete thyroid hormones (<xref ref-type="bibr" rid="B4">4</xref>), which regulate almost all physiological activities such as metabolism, energy balance, heart rate, body temperature, and even brain development. Therefore, maintaining normal thyroid hormone levels is essential to maintaining good health (<xref ref-type="bibr" rid="B5">5</xref>). However, when this critical gland becomes cancerous, the effects are profound and complex. As the most common malignant tumor of the endocrine system, thyroid cancer has a profound impact on the patient&#x2019;s quality of life and long-term prognosis (<xref ref-type="bibr" rid="B6">6</xref>). These impacts are not limited to the physiological level, but also include psychological and social dimensions, making the management of thyroid cancer a complex process that requires comprehensive consideration (<xref ref-type="bibr" rid="B7">7</xref>).</p>
<p>To fully understand and address the increasing disease burden of thyroid cancer, the GBD data provides a valuable and publicly accessible comprehensive database, covering detailed data on 354 diseases and injuries worldwide (<xref ref-type="bibr" rid="B8">8</xref>, <xref ref-type="bibr" rid="B9">9</xref>). The GBD data can effectively identify the latest trends and changes in thyroid cancer. Existing studies have extensively explored the overall global trends of thyroid cancer (<xref ref-type="bibr" rid="B10">10</xref>), and conducted specific analyses on the epidemiology of thyroid cancer within China (<xref ref-type="bibr" rid="B11">11</xref>&#x2013;<xref ref-type="bibr" rid="B13">13</xref>). In addition, some comparative studies have contrasted the trends of thyroid cancer in different sociodemographic index (SDI) regions, between China and the United States, within the European Union, and among certain countries (<xref ref-type="bibr" rid="B14">14</xref>&#x2013;<xref ref-type="bibr" rid="B17">17</xref>). However, at present, there are still obvious deficiencies in the comprehensive comparative analysis of the trend of thyroid cancer in China. Combining GBD macro-level data with micro-level electronic medical records offers a comprehensive view that bridges national trends and clinical realities. This kind of comparative analysis is crucial for China to identify its room for improvement in disease prevention and control and draw on the successful experiences of other countries.</p>
<p>This study uses GBD data to analyze and compare thyroid cancer patterns in China and predict future trends. The research analyzed key indicators such as the prevalence rate and mortality rate, and deeply explored the influence of factors such as gender and age on the disease burden. Furthermore, given that a high body mass index (BMI) is regarded as an important risk factor for thyroid cancer (<xref ref-type="bibr" rid="B18">18</xref>), this study will further explore the risk of attributable death and its causal relationship with thyroid cancer. Combined with the outpatient data of hospitals, the machine learning model is utilized to predict the future prevalence trend of thyroid cancer, with the expectation of providing empirical basis for formulating more precise prevention, control and treatment strategies for thyroid cancer in China and even globally.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Materials</title>
<sec id="s2_1_1">
<label>2.1.1</label>
<title>Global burden Of disease data</title>
<p>This study will utilize the publicly available data from the GBD study in 2021 to obtain key epidemiological indicators such as the prevalence and mortality of thyroid cancer in China and globally from 1990 to 2021. Thyroid cancer is divided into various types, including papillary carcinoma, follicular carcinoma, poorly differentiated carcinoma, undifferentiated carcinoma, and medullary carcinoma. The diagnostic codes for thyroid cancer in this study include C73-C73.9, D09.3, D09.8, D34-D34.9, D44.0, and Z85.850 in ICD-10.The GBD data is released by the Institute for Health Metrics and Evaluation (IHME), providing a comprehensive assessment of the burden of disease at the global, regional and national levels, ensuring the authority and comparability of the data (<xref ref-type="bibr" rid="B19">19</xref>). All GBD data through its official database (Global Burden of diseases Study 2021, <ext-link ext-link-type="uri" xlink:href="http://www.healthdata.org/gbd">http://www.healthdata.org/gbd</ext-link>).</p>
</sec>
<sec id="s2_1_2">
<label>2.1.2</label>
<title>Electronic medical record data</title>
<p>This study will collect the clinical data of patients with thyroid cancer from the Electronic Medical Records (EMR) system of our hospital. To ensure the consistency of data time, the time range ends with thyroid cancer patients who visited before 2021 (including 2021).The collected clinical indicators include the basic information of the patients (such as gender and age), physical examination data (such as BMI), and biochemical indicators related to thyroid function (such as TG, TP0AB, TGAB, TSH, FT4, FT3), as well as the final benign and malignant diagnosis results. These data are crucial for building precise machine learning prediction models. To ensure patient privacy and data security, all electronic medical record data will undergo strict anonymization and de-identification processing before analysis. To ensure data security, generate a unique ID for each patient that does not contain any personal information, and use this ID instead of the real identity in the analysis.</p>
</sec>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Methods</title>
<sec id="s2_2_1">
<label>2.2.1</label>
<title>The autoregressive integrated moving average model</title>
<p>The Autoregressive Integrated Moving Average (ARIMA) model is a widely used statistical method for analyzing and forecasting time series data. It works by analyzing the autocorrelation and non-stationarity present in the data. The core of the ARIMA model lies in its three components: the Autoregressive (AR) part uses a linear combination of past values to predict the current value; the Integrated (I) part addresses non-stationarity by differencing the data until it becomes stationary; and the Moving Average (MA) part uses a linear combination of past forecast errors to improve predictions.</p>
<p>An ARIMA model is typically denoted as ARIMA(p, d, q), where p is the order of the autoregressive component, d is the order of differencing, and q is the order of the moving average component. Building an ARIMA model involves several key steps: checking for stationarity, selecting appropriate model orders using Autocorrelation and Partial Autocorrelation Functions, estimating parameters, performing diagnostics, and generating forecasts. ARIMA is well-suited for time series data with strong autocorrelation and sees broad use in fields such as economics, finance, and meteorology. However, it assumes a linear relationship in the data and may not perform well for complex nonlinear patterns (<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B21">21</xref>). In this study, the ARIMA model was used based on historical GBD data to predict long-term trends in future prevalence and mortality rates, provided important evidence for public health decision-making.</p>
<p>The ARIMA model analysis was conducted in the R language environment, mainly utilizing the auto. arima() function in the forecast package. Before applying the ARIMA model, we first conducted a stationarity test on the original time series data. According to the test results, in order to eliminate the non stationarity of the sequence, we performed first-order differencing (d=1) on both the incidence and mortality data. The differencing operation ensured that the mean and variance of the sequence remained constant over time, meeting the requirements of ARIMA model for stationarity.</p>
<p>The auto. arima() function evaluates the goodness of fit of models with different combinations of p, d, and q based on the Akaike Information Criterion (AIC), and selects the optimal model. For the prevalence rate, the optimal model determined is ARIMA (1,1,1), with an AIC value of -140; For mortality rate, the optimal model determined is ARIMA (0,1,1), with an AIC value of -19.88. After the model is constructed, it is validated by checking the autocorrelation function (ACF) of the residual sequence. In addition, we also checked the normality distribution of the residuals to ensure the validity of the model assumptions.</p>
</sec>
<sec id="s2_2_2">
<label>2.2.2</label>
<title>Mendelian randomization analysis</title>
<p>Mendelian randomization (MR) is a method used to infer causal relationships between exposure factors and disease outcomes (<xref ref-type="bibr" rid="B22">22</xref>). We employed it to analyze the association between body mass index (BMI) and thyroid cancer. The core idea is that if a genetic variation is strongly correlated with the exposure factor, independent of confounding factors, and affects the disease outcome through the exposure factor, then the association between this genetic variation and the disease outcome can be used to infer the causal relationship between the exposure factor and the disease outcome (<xref ref-type="bibr" rid="B23">23</xref>).</p>
</sec>
<sec id="s2_2_3">
<label>2.2.3</label>
<title>Analysis machine learning prediction model</title>
<p>This study constructed and trained six machine learning classification models, achieving the prediction of benign and malignant thyroid cancer. XGBoost is a kind of efficient, flexible and scalable gradient boosting decision tree algorithm, which performs well in various prediction tasks (<xref ref-type="bibr" rid="B24">24</xref>, <xref ref-type="bibr" rid="B25">25</xref>). RandomForest improves the prediction accuracy and robustness by constructing multiple decision trees and taking their average results (<xref ref-type="bibr" rid="B26">26</xref>). DecisionTree represents decision rules through a tree-like structure (<xref ref-type="bibr" rid="B27">27</xref>). Gaussian Naive Bayes (GNB) is a probabilistic classifier based on Bayes&#x2019; theorem, assuming that features are independent of each other and follow a Gaussian distribution (<xref ref-type="bibr" rid="B28">28</xref>). Multi-layer Perceptron (MLP) is a kind of feedforward artificial neural network that contains at least one hidden layer and is capable of learning complex nonlinear relationships (<xref ref-type="bibr" rid="B29">29</xref>). The Support Vector Machine (SVM) separates data points of different categories by finding the optimal hyperplane (<xref ref-type="bibr" rid="B30">30</xref>, <xref ref-type="bibr" rid="B31">31</xref>).</p>
</sec>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>The prevalence rate of thyroid cancer in China from 1990 to 2021</title>
<p>
<xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1A, C</bold>
</xref> analyze the prevalence of thyroid cancer among women and men in China from 1990 to 2021. In 1990 (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1A</bold>
</xref>), the crude prevalence rate of thyroid cancer in China increased with age, and the prevalence rate peaked at the age of 55-59. However, in 2021 (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1C</bold>
</xref>), the peak prevalence rate for women shifted to the age of 60-64, while that for men remained at 55-59, showing a significant decline at the age of 60-64. Since 1990, the overall prevalence rate has shown a marked increase. For women, the prevalence rate is higher than that of men in most age groups. Moreover, the development trend of the disease among women is largely consistent, with a decline occurring between the ages of 45 and 49.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>The prevalence and mortality rates of thyroid cancer in China from 1990 to 2021. <bold>(A)</bold> the rate of prevalence in 1990. <bold>(B)</bold> the rate of mortality in 1990. <bold>(C)</bold> the rate of prevalence in 2021. <bold>(D)</bold> the rate of mortality in 2021.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-16-1644396-g001.tif">
<alt-text content-type="machine-generated">Four line graphs display data by sex and age. Graph A and C illustrate prevalence rates, with females showing higher rates than males, especially in middle age. Graph B and D depict death rates, where males have higher rates, particularly in older age groups. Each graph includes shaded areas indicating variability.</alt-text>
</graphic>
</fig>
<p>Between 1990 and 2021, cases per 100,000 people rose from 0.87 (95%UI 0.69, 1.0) to 3.88 (95%UI 3.12, 4.88). Among males, the number of affected cases increased from 0.19 (95%UI 0.15, 0.26) to 1.55 (95%UI 1.11, 2.08). The number of female patients increased from 0.68 (95%UI 0.49, 0.84) to 2.33 (95%UI 1.69, 3.46).</p>
<p>The ASPR of the entire population increased from 8.1 (6.41, 9.66) in 1990 to 20.01 (16.14, 25.23). The proportion of males increased from 3.52 (2.77, 4.73) to 15.87 (11.35, 20.96). The ASPR of females increased from 13 (9.36, 16.16) to 24.24 (17.62, 36.4). This indicates that the prevalence rates of both men and women have increased, and the ASPR of women has always been higher than that of men (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>).</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>The prevalence and mortality rates of thyroid cancer in China from 1990 to 2021.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Disease burden, per 100,000 no. (95%UI)</th>
<th valign="middle" align="left">1990</th>
<th valign="middle" align="left">2021</th>
</tr>
</thead>
<tbody>
<tr>
<th valign="middle" colspan="3" align="left">Prevalence case</th>
</tr>
<tr>
<td valign="middle" align="left">Both</td>
<td valign="middle" align="left">0.87 (0.69,1.0)</td>
<td valign="middle" align="left">3.88 (3.12,4.88)</td>
</tr>
<tr>
<td valign="middle" align="left">Female</td>
<td valign="middle" align="left">0.68 (0.49,0.84)</td>
<td valign="middle" align="left">2.33 (1.69,3.46)</td>
</tr>
<tr>
<td valign="middle" align="left">Male</td>
<td valign="middle" align="left">0.19 (0.15,0.26)</td>
<td valign="middle" align="left">1.55 (1.11,2.08)</td>
</tr>
<tr>
<th valign="middle" colspan="3" align="left">ASPR</th>
</tr>
<tr>
<td valign="middle" align="left">Both</td>
<td valign="middle" align="left">8.1 (6.41,9.66)</td>
<td valign="middle" align="left">20.01 (16.14,25.23)</td>
</tr>
<tr>
<td valign="middle" align="left">Female</td>
<td valign="middle" align="left">13 (9.36,16.16)</td>
<td valign="middle" align="left">24.24 (17.62,36.4)</td>
</tr>
<tr>
<td valign="middle" align="left">Male</td>
<td valign="middle" align="left">3.52 (2.77,4.73)</td>
<td valign="middle" align="left">15.87 (11.35,20.96)</td>
</tr>
<tr>
<th valign="middle" colspan="3" align="left">ASMR</th>
</tr>
<tr>
<td valign="middle" align="left">Both</td>
<td valign="middle" align="left">0.47 (0.4,0.55)</td>
<td valign="middle" align="left">0.39 (0.31,0.47)</td>
</tr>
<tr>
<td valign="middle" align="left">Female</td>
<td valign="middle" align="left">0.57 (0.43, 0.69)</td>
<td valign="middle" align="left">0.32 (0.24,0.45)</td>
</tr>
<tr>
<td valign="middle" align="left">Male</td>
<td valign="middle" align="left">0.38 (0.31,0.51)</td>
<td valign="middle" align="left">0.49 (0.33,0.64)</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Mortality rate of thyroid in China from 1990 to 2021</title>
<p>In 1990 (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1B</bold>
</xref>), the crude mortality rate of the age group under 50 in China was close to 0. It began to change significantly at the age of 50. Before age 80, women had a higher mortality rate than men. After the age of 80, the mortality rate of men increased rapidly and reached its peak between the ages of 90 and 94. By 2021 (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1D</bold>
</xref>), the crude death rate for the under-50 age group remained close to zero. The mortality gap between men and women remained small until age 75. However, the mortality rate for men increased rapidly after the age of 75, reaching its peak at 90-94 years old. Furthermore, compared with 1990, the mortality rate of men is increasing while that of women is decreasing. Despite these changes, the overall mortality trends of both sexes remain similar.</p>
<p>The AMPR of the entire population decreased from 0.47 (0.4, 0.55) in 1990 to 0.39 (0.31, 0.47). The AMPR of men increased from 0.38 (0.31, 0.51) to 0.49 (0.33, 0.64), while that of women decreased from 0.57 (0.43, 0.69) to 0.32 (0.24, 0.45) (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>).</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Analysis of risk factors for death from thyroid cancer</title>
<p>Based on the data analysis of GBD 2021, the risk of death from thyroid cancer caused by high body mass index (BMI) in China showed a significant increasing trend from 1990 to 2021.As shown in <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>, the proportion of deaths from thyroid cancer due to high BMI in males increased from 6.89% to 10.40% (an increase of 50.97%), and in females it increased from 7.84% to 12% (an increase of 53.06%).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Analysis of risk factors for death. x-axis: Year; y-axis: Percentage of deaths.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-16-1644396-g002.tif">
<alt-text content-type="machine-generated">Line chart depicting the percentage of deaths from 1990 to 2020. Multiple lines represent different categories, all showing an upward trend. The y-axis ranges from 5% to 14%, and the x-axis covers the years.</alt-text>
</graphic>
</fig>
<p>It is worth noting that metabolic risks associated with female obesity may be more sensitive to the prognosis of thyroid cancer. Overall, high BMI remains a key modifiable risk factor, with a more pronounced impact on women.</p>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Relationship between BMI and thyroid cancer through MR analysis</title>
<p>Using BMI as the exposure variable and thyroid cancer as the outcome variable, select SNPs related to BMI as instrumental variables, and meet the following conditions: (1) Association hypothesis: Select SNP loci that are strongly correlated with exposure factors to ensure that the selected SNPs accurately reflect the genetic characteristics of thyroid cancer. (2) Independence hypothesis: SNP loci associated with confounding factors were excluded to eliminate the influence of external interference on the research results. (3) Exclusivity assumption: Only SNP loci that have an effect on the junction through exposure factors are retained to ensure the uniqueness of the causal relationship (<xref ref-type="bibr" rid="B32">32</xref>, <xref ref-type="bibr" rid="B33">33</xref>).</p>
<p>When choosing tools, set the significance threshold at P&lt;5&#xd7;10-6 to preliminarily screen SNPS that are significantly related to BMI (<xref ref-type="bibr" rid="B34">34</xref>). Then, set the linkage disequilibrium parameter r2 = 0.001 and the genetic distance to 10,000 kb to avoid the bias caused by the linkage disequilibrium among SNPS. To conform to the exclusivity hypothesis, P&lt;5&#xd7;10-6 was set to eliminate SNPS related to the outcome (<xref ref-type="bibr" rid="B35">35</xref>). To meet the independence hypothesis, SNPS related to confounding factors need to be eliminated, and PheoScanner is used to query SNP-related models.</p>
<p>Through MR Analysis, there is a positive causal relationship between thyroid cancer and BMI(MR-Egger: OR=1.822, 95%CI: 0.1414-23.519, P=0.0646; IVW: OR=0.953, 95%CI: 0.358-2.2535, P=0.00242, Weighted mode: OR=0.403,95%CI: 0.048-3.395, P=0.0404), as shown in <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Analysis of MR results with BMI as the exposure factor.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Id.exposure</th>
<th valign="middle" align="left">Method</th>
<th valign="middle" align="left">Nsnp</th>
<th valign="middle" align="left">OR (95%CI)</th>
<th valign="middle" align="left">Pval</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="3" align="left">BMI</td>
<td valign="middle" align="left">MR-Egger</td>
<td valign="middle" align="left">219</td>
<td valign="middle" align="left">1.822 (0.1414-23.519)</td>
<td valign="middle" align="left">0.0646</td>
</tr>
<tr>
<td valign="middle" align="left">IVW</td>
<td valign="middle" align="left">219</td>
<td valign="middle" align="left">0.953 (0.358-2.2535)</td>
<td valign="middle" align="left">0.00242</td>
</tr>
<tr>
<td valign="middle" align="left">Weighted mode</td>
<td valign="middle" align="left">219</td>
<td valign="middle" align="left">0.403 (0.048-3.395)</td>
<td valign="middle" align="left">0.0404</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The IVW method is the most commonly used and statistically effective method in MR analysis. If the P value is less than 0.05, it is considered that there is statistical evidence supporting the causal effect of exposure on outcomes. However, the IVW method is highly sensitive to horizontal pleiotropy, and the estimation results of IVW may be biased. If the P-values of IVW and weighted median method are both significant and consistent in direction, this will enhance the conclusion of causal inference. The results showed that the P-values of IVW and Weighted mode were both less than 0.05, and the effect directions were consistent, indicating a causal relationship between BMI and thyroid cancer. This suggests that BMI may be an important factor in increasing the risk of thyroid cancer.</p>
</sec>
<sec id="s3_5">
<label>3.5</label>
<title>Prediction of multiple machine learning models based on SHAP interpretation</title>
<p>In order to better predict the future prevalence trend of thyroid cancer, we used ARIMA to predict the prevalence and mortality of thyroid cancer in the next 10 years. The prevalence is projected to rise from 20.01% in 2021 to 23.58% by 2031. The mortality rate is expected to remain stable, around 0.41%, during the same period. As shown in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Forecast of the prevalence and mortality trends of thyroid cancer in China over the next 10 years (2021-2031). The real trends of prevalence and mortality in red lines. The yellow dotted lines and shaded areas represent the predicted trends and their 95%CI.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-16-1644396-g003.tif">
<alt-text content-type="machine-generated">Two graphs comparing actual and forecasted values over the years from 1990 to 2030. Panel A shows ASPR, which rises steadily until 2020 and then projects upward. Panel B shows ASMR, remaining relatively stable with a slight forecasted rise after 2020. Both graphs use red for actual values and yellow for forecasts, with a dashed line marking the transition between actual and forecasted data.</alt-text>
</graphic>
</fig>
<p>Through the predictive analysis of GBD data, it was found that the prevalence of thyroid cancer still shows an increasing trend. To gain deeper insights into the current status and future progression of the disease, we built several machine learning models using hospital-based data. A total of 6,565 patients were included in this study, including 4,631 patients with malignant thyroid cancer and 1,934 patients with benign thyroid cancer. The data were randomly divided into the training set and the test set. The training set had a total of 5252 samples, and the test set had a total of 1313 samples.</p>
<p>For cases of missing data, Hot Deck Imputation was employed. Find the complete sample that is most similar to the missing value sample from the dataset, and use the value of this complete sample to fill in the missing value. The advantage of this method lies in its ability to preserve the original distribution of data, as it is filled based on actual observed values.</p>
<p>This study adopted a feature selection strategy that comprehensively considers clinical relevance, data availability and completeness, and model interpretability requirements when constructing a thyroid cancer benign and malignant prediction model. We carefully selected 9 clinical features closely related to thyroid disease diagnosis and patient basic information from hospital electronic medical records as model inputs.</p>
<p>Before conducting the model establishment analysis, the normality test of each index should be carried out first (<xref ref-type="bibr" rid="B36">36</xref>). When the P value of the normality test is greater than 0.05, it indicates that the index follows a normal distribution. The specific data are shown in <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>. The indicators that follow a normal distribution include age, BMI, TG,FT3 etc.</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Comparison of indicators related to benign and malignant thyroid.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Eigenvalue</th>
<th valign="middle" align="center">Total (N=6565)</th>
<th valign="middle" align="center">Malignant (n=4631)</th>
<th valign="middle" align="center">Benign (N=1934)</th>
<th valign="middle" align="center">p.overall</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">sex, N (%):</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center">0.727</td>
</tr>
<tr>
<td valign="middle" align="center">male</td>
<td valign="middle" align="center">1548 (23.580%)</td>
<td valign="middle" align="center">1086 (23.451%)</td>
<td valign="middle" align="center">462 (23.888%)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="center">female</td>
<td valign="middle" align="center">5017 (76.420%)</td>
<td valign="middle" align="center">3545 (76.549%)</td>
<td valign="middle" align="center">1472 (76.112%)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="center">age, Median [Q1-Q3]</td>
<td valign="middle" align="center">47.000 [38.000;56.000]</td>
<td valign="middle" align="center">45.000 [36.000;54.000]</td>
<td valign="middle" align="center">52.000 [43.000;60.000]</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="middle" align="center">BMI, N (%):</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center">0.000</td>
</tr>
<tr>
<td valign="middle" align="center">Overweight</td>
<td valign="middle" align="center">4590 (69.916%)</td>
<td valign="middle" align="center">4561 (98.488%)</td>
<td valign="middle" align="center">29 (1.499%)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="center">normal</td>
<td valign="middle" align="center">1960 (29.855%)</td>
<td valign="middle" align="center">61 (1.317%)</td>
<td valign="middle" align="center">1899 (98.190%)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="center">low weight</td>
<td valign="middle" align="center">15 (0.228%)</td>
<td valign="middle" align="center">9 (0.194%)</td>
<td valign="middle" align="center">6 (0.310%)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="center">TG, Median [Q1-Q3]</td>
<td valign="middle" align="center">19.250 [8.185;51.460]</td>
<td valign="middle" align="center">15.530 [6.785;33.555]</td>
<td valign="middle" align="center">44.200 [15.660;162.200]</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="middle" align="center">TP0AB, Median [Q1-Q3]</td>
<td valign="middle" align="center">1.200 [0.500;11.918]</td>
<td valign="middle" align="center">0.500 [0.500;7.660]</td>
<td valign="middle" align="center">6.430 [0.500;16.780]</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="middle" align="center">TGAB, Median [Q1-Q3]</td>
<td valign="middle" align="center">2.030 [0.500;16.053]</td>
<td valign="middle" align="center">1.600 [0.500;14.175]</td>
<td valign="middle" align="center">10.000 [1.110;18.778]</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="middle" align="center">TSH, Median [Q1-Q3]</td>
<td valign="middle" align="center">1.672 [1.090;2.498]</td>
<td valign="middle" align="center">1.749 [1.183;2.572]</td>
<td valign="middle" align="center">1.466 [0.875;2.283]</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="middle" align="center">FT4, Median [Q1-Q3]</td>
<td valign="middle" align="center">13.390 [12.180;15.000]</td>
<td valign="middle" align="center">13.100 [12.010;14.395]</td>
<td valign="middle" align="center">14.440 [12.718;16.600]</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="middle" align="center">FT3, Median [Q1-Q3]</td>
<td valign="middle" align="center">4.365 [3.900;4.860]</td>
<td valign="middle" align="center">4.410 [4.000;4.890]</td>
<td valign="middle" align="center">4.200 [3.270;4.762]</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Six machine learning prediction models were constructed to predict the prevalence of thyroid cancer patients. During the model parameter tuning process, we utilized the grid search method. The aim is to find the optimal combination of hyperparameters through algorithms rather than manual trial and error, in order to achieve the best performance of the model. Predefine the discrete value range or list for each hyperparameter, and then iterate through all possible combinations of hyperparameters. For each combination, the model undergoes training and evaluation, followed by recording of performance metrics.</p>
<p>For the evaluation of the model, we utilized metrics such as AUC, accuracy, sensitivity, and specificity. The specific calculation formulas are as follows:</p>
<disp-formula>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:mi>A</mml:mi>
<mml:mtext>ccuracy</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<mml:math display="block" id="M2">
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>v</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>y</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<mml:math display="block" id="M3">
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>y</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>True Positive (TP): The number of samples that are actually positive and also predicted as positive. True Negative (TN): The number of samples that are actually negative and also predicted as negative. False Positive (FP): The number of samples that are actually negative but are predicted as positive. False Negative (FN): The number of samples that are actually positive but are predicted as negative. <xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref> shows the performance evaluation indicators of the six machine learning models constructed in this study (XGBoost, RandomForest, DecisionTree, GNB, MLP, SVM) in predicting the benign and malignant nature of thyroid cancer. The XGBoost model exhibits the best overall predictive performance. Its AUC value is as high as 0.999, accuracy is 0.984, sensitivity is 0.973, specificity is 0.988, positive predictive value is 0.968, negative predictive value is 0.990, and F1 score is 0.971. This indicates that XGBoost has extremely high accuracy and robustness in distinguishing benign and malignant thyroid cancer. In contrast, the performance of MLP and SVM is relatively poor. The AUC of MLP is only 0.661, the accuracy is 0.715, the sensitivity is only 0.469, and the F1 score is 0.480, indicating that its performance in this thyroid cancer benign and malignant prediction task is not ideal. Therefore, the XGBoost model based on gradient boosting demonstrated excellent performance in the benign and malignant prediction task of thyroid cancer in this study, far surpassing other traditional machine learning methods.</p>
<table-wrap id="T4" position="float">
<label>Table&#xa0;4</label>
<caption>
<p>Comparison of results from multiple models.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Models</th>
<th valign="middle" align="center">AUC</th>
<th valign="middle" align="center">Accuracy</th>
<th valign="middle" align="center">Sensitivity</th>
<th valign="middle" align="center">Specificity</th>
<th valign="middle" align="center">Positive predictive value</th>
<th valign="middle" align="center">Negative predictive value</th>
<th valign="middle" align="center">F1 score</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">XGBoost</td>
<td valign="middle" align="center">0.999</td>
<td valign="middle" align="center">0.984</td>
<td valign="middle" align="center">0.973</td>
<td valign="middle" align="center">0.988</td>
<td valign="middle" align="center">0.968</td>
<td valign="middle" align="center">0.990</td>
<td valign="middle" align="center">0.971</td>
</tr>
<tr>
<td valign="middle" align="center">RandomForest</td>
<td valign="middle" align="center">0.997</td>
<td valign="middle" align="center">0.987</td>
<td valign="middle" align="center">0.985</td>
<td valign="middle" align="center">0.987</td>
<td valign="middle" align="center">0.967</td>
<td valign="middle" align="center">0.994</td>
<td valign="middle" align="center">0.976</td>
</tr>
<tr>
<td valign="middle" align="center">DecisionTree</td>
<td valign="middle" align="center">0.979</td>
<td valign="middle" align="center">0.983</td>
<td valign="middle" align="center">0.970</td>
<td valign="middle" align="center">0.988</td>
<td valign="middle" align="center">0.970</td>
<td valign="middle" align="center">0.988</td>
<td valign="middle" align="center">0.970</td>
</tr>
<tr>
<td valign="middle" align="center">GNB</td>
<td valign="middle" align="center">0.991</td>
<td valign="middle" align="center">0.984</td>
<td valign="middle" align="center">0.989</td>
<td valign="middle" align="center">0.982</td>
<td valign="middle" align="center">0.953</td>
<td valign="middle" align="center">0.996</td>
<td valign="middle" align="center">0.971</td>
</tr>
<tr>
<td valign="middle" align="center">MLP</td>
<td valign="middle" align="center">0.661</td>
<td valign="middle" align="center">0.715</td>
<td valign="middle" align="center">0.469</td>
<td valign="middle" align="center">0.811</td>
<td valign="middle" align="center">0.492</td>
<td valign="middle" align="center">0.796</td>
<td valign="middle" align="center">0.480</td>
</tr>
<tr>
<td valign="middle" align="center">SVM</td>
<td valign="middle" align="center">0.838</td>
<td valign="middle" align="center">0.769</td>
<td valign="middle" align="center">0.831</td>
<td valign="middle" align="center">0.743</td>
<td valign="middle" align="center">0.569</td>
<td valign="middle" align="center">0.917</td>
<td valign="middle" align="center">0.675</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The importance of features and the interpretability of the model are key aspects in evaluating performance. In the XGBoost model, BMI has the greatest influence among the nine common clinical features, as shown in <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>. The SHAP graph illustrates how each feature contributes to the model by displaying the distribution of SHAP values. The horizontal axis represents the SHAP value of the XGBoost model, and the color of the points indicates the size of the feature value. If the SHAP is positive, it indicates that the feature has a positive contribution.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>SHAP values.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-16-1644396-g004.tif">
<alt-text content-type="machine-generated">SHAP summary plot showing feature impact on model output. Features like BMI, TG, TSH, and others are listed on the y-axis. The x-axis indicates SHAP values ranging from -0.2 to 1.0. Dots represent feature values, colored from blue (low) to red (high), illustrating their significance in model predictions. BMI has the most significant positive impact.</alt-text>
</graphic>
</fig>
<p>From <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>, it can be clearly seen that the SHAP value distribution range of BMI is the widest, and its points are mainly concentrated in the larger positive areas. This indicates that BMI is the most important clinical feature affecting the prediction of benign and malignant thyroid cancer. A high BMI value is associated with a higher SHAP value, indicating that a high BMI significantly increases the likelihood of the model predicting malignancy. This is consistent with the conclusion drawn from Mendelian randomization analysis in the study that there is a positive causal relationship between BMI and thyroid cancer, further emphasizing the crucial role of BMI in the occurrence and development of thyroid cancer.</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>This study aims to conduct an in-depth analysis of the disease patterns and future trends of thyroid cancer in China, and to construct an intelligent prediction model in combination with hospital electronic medical record data. It was found that the incidence of thyroid cancer in China has significantly increased, which is consistent with the global trend (<xref ref-type="bibr" rid="B37">37</xref>) and epidemiological analysis within China (<xref ref-type="bibr" rid="B38">38</xref>). The higher prevalence rate among women may be linked to hormone levels, autoimmune thyroid disease, and more frequent screenings. The peak age of onset for women has shifted from 55-59 years old in 1990 to 60-64 years old in 2021, which may reflect the aging of the population, the advancement of diagnostic techniques, and the evolution of the natural history of diseases. Although the prevalence rate continues to rise, the overall mortality rate remains relatively stable. This might be due to the popularization of early diagnosis, the advancement of treatment methods and the improvement of public health awareness. However, the rising trend of male mortality suggests that more in-depth attention should be paid to the risk factors and prognosis of thyroid cancer in men.</p>
<p>This study is the first to combine macroscopic GBD data with microscopic electronic medical record data from our hospital, providing a comprehensive perspective from the national level to clinical practice. This integration compensates for the limitations of a single data source (<xref ref-type="bibr" rid="B39">39</xref>), allowing research results to reflect the trend of disease burden nationwide and delve into the clinical characteristics of individual patients, providing a more solid foundation for developing precise prevention and control strategies.</p>
<p>This study introduced Mendelian randomization analysis to validate the relationship between BMI and thyroid cancer from a genetic causal perspective, which is relatively rare in previous research on thyroid cancer in China (<xref ref-type="bibr" rid="B40">40</xref>). The number of deaths from thyroid cancer caused by high BMI has surged in the past thirty years, which is consistent with the global trend of obesity and emphasizes the important role of obesity in the occurrence and development of thyroid cancer (<xref ref-type="bibr" rid="B41">41</xref>, <xref ref-type="bibr" rid="B42">42</xref>). The results of MR analysis provide strong evidence that BMI is not only an accompanying phenomenon of thyroid cancer, but also an independent risk factor. This may be related to mechanisms such as chronic inflammation, insulin resistance, and endocrine disorders caused by obesity (<xref ref-type="bibr" rid="B43">43</xref>), providing new targets and stronger evidence support for the prevention and intervention of thyroid cancer.</p>
<p>This study constructed and compared various advanced machine learning models such as XGBoost and RandomForest (<xref ref-type="bibr" rid="B44">44</xref>), achieving high-precision prediction of benign and malignant thyroid cancer. The XGBoost model showed the best predictive performance, with an AUC value of up to 0.999, far exceeding the predictive ability of traditional statistical methods. More importantly, this study used interpretable methods such as SHAP values (<xref ref-type="bibr" rid="B45">45</xref>) to reveal key predictive features, clarifying that BMI is the most important clinical feature affecting thyroid cancer prediction, followed by thyroid function indicators such as TG, TSH, FT3, FT4, which are consistent with the physiological and pathological basis of thyroid disease (<xref ref-type="bibr" rid="B46">46</xref>). This interpretability not only enhances the transparency and clinical practicality of the model, but also provides a basis for clinical doctors to understand the decision-making process of the model, surpassing the limitations of traditional statistical methods and providing intelligent support for clinical decision-making.</p>
<p>This study analyzed the relationship between BMI and thyroid cancer by integrating GBD data and electronic medical record data and applying machine learning methods, successfully constructing a predictive model. Based on these findings, we propose the following multi-level implementation suggestions, aiming to translate research findings into practical actions to improve the prevention, diagnosis, and management of thyroid cancer. At the data level, we suggest further in-depth exploration of the GBD data, conducting refined regional and subgroup analyses to reveal the association patterns between BMI and thyroid cancer under different contexts. At the methodological level, we should actively promote the deployment and optimization of the machine learning prediction model developed in this study in clinical practice, integrate it into auxiliary diagnostic systems, and continuously collect new data for model retraining and interpretability research, ensuring its accuracy and practicality.</p>
<p>At the clinical practice level, it is recommended to focus on strengthening early screening and risk assessment for thyroid cancer, especially for individuals with a high BMI. This includes strengthening BMI monitoring during routine physical examinations and providing earlier or more frequent thyroid ultrasound examinations for overweight or obese individuals. At the policy and public health levels, it is recommended that the government and health departments formulate and refine national-level obesity prevention and control strategies, and integrate them organically with the prevention and control of thyroid diseases. Meanwhile, based on the macro data analysis of this study, it is advisable to guide the rational allocation of medical resources and allocate more resources to the screening and management of high-incidence areas or high-risk populations for thyroid cancer.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusions</title>
<p>This study comprehensively analyzed the disease burden pattern of thyroid cancer in China from 1990 to 2021, revealing the significant upward trend of prevalence and the causal role of high BMI as an important controllable risk factor. By combining global disease burden data with hospital electronic medical records and applying advanced statistical and machine learning methods, we offered a comprehensive view of the epidemiological evolution of thyroid cancer in China. We also successfully built a high-precision prediction model for benign and malignant thyroid cancer. These findings provide a solid scientific basis for formulating more precise and effective strategies for the prevention, early diagnosis and management of thyroid cancer in China and even globally. This study emphasizes the importance of strengthening obesity intervention at the public health level and provides a feasible path for the use of artificial intelligence-assisted diagnosis in clinical practice. Looking to the future, the achievements of this study will lay a solid foundation for further in-depth exploration of the complex etiology of thyroid cancer, optimization of the diagnosis and treatment process, and ultimately improvement of patients&#x2019; health outcomes.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. Further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s7" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving humans were approved by Medical Ethics Committee of Shandong Provincial Third Hospital(No.KYLL-2021100). The studies were conducted in accordance with the local legislation and institutional requirements. Written informed consent for participation was not required from the participants or the participants&#x2019; legal guardians/next of kin because the study is a retrospective algorithmic research that only extracts patient testing related information and does not involve patient privacy information; And without intervening with patients, there will be no risk of medical or privacy leakage to patients.</p>
</sec>
<sec id="s8" sec-type="author-contributions">
<title>Author contributions</title>
<p>LY: Writing &#x2013; original draft, Data curation, Methodology, Writing &#x2013; review &amp; editing. SZ: Writing &#x2013; original draft, Supervision, Software. XW: Formal Analysis, Investigation, Writing &#x2013; review &amp; editing. JY: Validation, Funding acquisition, Writing &#x2013; review &amp; editing. MC: Investigation, Writing &#x2013; review &amp; editing, Validation, Formal Analysis, Writing &#x2013; original draft.</p>
</sec>
<sec id="s9" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research and/or publication of this article. This study was supported by the Natural Science Foundation of Shandong Province (nos. ZR2021MH227), and Jinan Science and Technology Bureau plan (202019181).</p>
</sec>
<sec id="s10" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s11" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec id="s12" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s13" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fendo.2025.1644396/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fendo.2025.1644396/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table1.xlsx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sung</surname> <given-names>H</given-names>
</name>
<name>
<surname>Ferlay</surname> <given-names>J</given-names>
</name>
<name>
<surname>Siegel</surname> <given-names>RL</given-names>
</name>
<name>
<surname>Laversanne</surname> <given-names>M</given-names>
</name>
<name>
<surname>Soerjomataram</surname> <given-names>I</given-names>
</name>
<name>
<surname>Jemal</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Global cancer statistics 2020: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title>. <source>CA Cancer J Clin</source>. (<year>2021</year>) <volume>71</volume>:<page-range>209&#x2013;49</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3322/caac.21660</pub-id>, PMID: <pub-id pub-id-type="pmid">33538338</pub-id></citation></ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bray</surname> <given-names>F</given-names>
</name>
<name>
<surname>Ferlay</surname> <given-names>J</given-names>
</name>
<name>
<surname>Soerjomataram</surname> <given-names>I</given-names>
</name>
<name>
<surname>Siegel</surname> <given-names>RL</given-names>
</name>
<name>
<surname>Torre</surname> <given-names>LA</given-names>
</name>
<name>
<surname>Jemal</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Global cancer statistics 2018: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title>. <source>CA Cancer J Clin</source>. (<year>2018</year>) <volume>68</volume>:<fpage>394</fpage>&#x2013;<lpage>424</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3322/caac.21492</pub-id>, PMID: <pub-id pub-id-type="pmid">30207593</pub-id></citation></ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kitahara</surname> <given-names>CM</given-names>
</name>
<name>
<surname>Sosa</surname> <given-names>JA</given-names>
</name>
</person-group>. <article-title>Understanding the ever-changing incidence of thyroid cancer</article-title>. <source>Nat Rev Endocrinol</source>. (<year>2020</year>) <volume>16</volume>:<page-range>617&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41574-020-00414-9</pub-id>, PMID: <pub-id pub-id-type="pmid">32895503</pub-id></citation></ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dhir</surname> <given-names>G</given-names>
</name>
<name>
<surname>Jain</surname> <given-names>V</given-names>
</name>
<name>
<surname>Merritt</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>THYROID DISORDERS</article-title>. <source>Prof Med J</source>. (<year>2025</year>) <volume>3</volume>:<page-range>405&#x2013;15</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.29309/TPMJ/2015.22.10.982</pub-id>
</citation></ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qin</surname> <given-names>J</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>X</given-names>
</name>
</person-group>. <article-title>Research progress in the etiology of thyroid cancer</article-title>. <source>Chin J Otorhinolaryngol Head Neck Surg</source>. (<year>2020</year>) <volume>55</volume>:<page-range>711&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3760/cma.j.cn115330-20191226-00783</pub-id>, PMID: <pub-id pub-id-type="pmid">32668886</pub-id></citation></ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>Z</given-names>
</name>
</person-group>. <article-title>Emotional disorder and related psychosocial factors in tumor patients</article-title>. <source>Chin J Rehabil Theory Pract</source>. (<year>2017</year>).</citation></ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>B-j</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>M-j</given-names>
</name>
</person-group>. <article-title>Investigation of psychological health status in Malignant tumor patients</article-title>. <source>Int J Nurs</source>. (<year>2015</year>) <volume>00</volume>:<page-range>1315&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3760/CMA.J.ISSN.1673-4351.2015.10.008</pub-id>
</citation></ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cao</surname> <given-names>W</given-names>
</name>
<name>
<surname>Qin</surname> <given-names>K</given-names>
</name>
<name>
<surname>Li</surname> <given-names>F</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>W</given-names>
</name>
</person-group>. <article-title>Socioeconomic inequalities in cancer incidence and mortality: An analysis of GLOBOCAN 2022</article-title>. <source>Chin Med J (Engl)</source>. (<year>2024</year>) <volume>12</volume>:<page-range>1407&#x2013;13</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/CM9.0000000000003140</pub-id>, PMID: <pub-id pub-id-type="pmid">38616547</pub-id></citation></ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<collab>GBD 2019 Risk Factors Collaborators</collab>
</person-group>. <article-title>Global burden of 87 risk factors in 204 countries and territories, 1990-2019: a systematic analysis for the Global Burden of Disease Study 2019</article-title>. <source>Lancet</source>. (<year>2020</year>) <volume>396</volume>:<page-range>1223&#x2013;49</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0140-6736(20)30752-2</pub-id>
</citation></ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Deng</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Li</surname> <given-names>H</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>M</given-names>
</name>
<name>
<surname>Li</surname> <given-names>N</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>T</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Global burden of thyroid cancer from 1990 to 2017</article-title>. <source>JAMA Netw Open</source>. (<year>2020</year>) <volume>3</volume>:<elocation-id>e208759</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1001/jamanetworkopen.2020.8759</pub-id>, PMID: <pub-id pub-id-type="pmid">32589231</pub-id></citation></ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cheng</surname> <given-names>F</given-names>
</name>
<name>
<surname>Xiao</surname> <given-names>J</given-names>
</name>
<name>
<surname>Shao</surname> <given-names>C</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>F</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>L</given-names>
</name>
<name>
<surname>Ju</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Burden of thyroid cancer from 1990 to 2019 and projections of incidence and mortality until 2039 in China: findings from global burden of disease study</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2021</year>) <volume>12</volume>:<elocation-id>738213</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fendo.2021.738213</pub-id>, PMID: <pub-id pub-id-type="pmid">34690931</pub-id></citation></ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>X</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>J</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>C</given-names>
</name>
<name>
<surname>Yin</surname> <given-names>C</given-names>
</name>
<name>
<surname>Bai</surname> <given-names>R</given-names>
</name>
</person-group>. <article-title>The epidemic of thyroid cancer in China: Current trends and future prediction</article-title>. <source>Front Oncol</source>. (<year>2022</year>) <volume>12</volume>:<elocation-id>932729</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fonc.2022.932729</pub-id>, PMID: <pub-id pub-id-type="pmid">36119514</pub-id></citation></ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jin</surname> <given-names>S</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>L</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>X</given-names>
</name>
<name>
<surname>Xia</surname> <given-names>K</given-names>
</name>
</person-group>. <article-title>Thyroid cancer burden and risk factors in China from 1990-2019: a systematic analysis using the global burden of disease study</article-title>. <source>Front Oncol</source>. (<year>2023</year>) <volume>13</volume>:<elocation-id>1231636</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fonc.2023.1231636</pub-id>, PMID: <pub-id pub-id-type="pmid">38023126</pub-id></citation></ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname> <given-names>L</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>ZX</given-names>
</name>
<name>
<surname>Weng</surname> <given-names>X</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>CF</given-names>
</name>
</person-group>. <article-title>Global thyroid cancer incidence trend and age-period-cohort model analysis based on Global Burden of Disease Study from 1990 to 2019</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2023</year>) <volume>14</volume>:<elocation-id>1133098</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fendo.2023.1133098</pub-id>, PMID: <pub-id pub-id-type="pmid">37124740</pub-id></citation></ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cui</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Mubarik</surname> <given-names>S</given-names>
</name>
<name>
<surname>Li</surname> <given-names>R</given-names>
</name>
<name>
<surname>Nawsherwan</surname>
</name>
<name>
<surname>Yu</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>Trend dynamics of thyroid cancer incidence among China and the U.S. adult population from 1990 to 2017: a joinpoint and age-period-cohort analysis</article-title>. <source>BMC Public Health</source>. (<year>2021</year>) <volume>21</volume>:<fpage>624</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12889-021-10635-w</pub-id>, PMID: <pub-id pub-id-type="pmid">33789605</pub-id></citation></ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schuster-Bruce</surname> <given-names>J</given-names>
</name>
<name>
<surname>Jani</surname> <given-names>C</given-names>
</name>
<name>
<surname>Goodall</surname> <given-names>R</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>D</given-names>
</name>
<name>
<surname>Hughes</surname> <given-names>W</given-names>
</name>
<name>
<surname>Salciccioli</surname> <given-names>JD</given-names>
</name>
<etal/>
</person-group>. <article-title>A comparison of the burden of thyroid cancer among the European union 15+ Countries, 1990-2019: estimates from the global burden of disease study</article-title>. <source>JAMA Otolaryngol Head Neck Surg</source>. (<year>2022</year>) <volume>148</volume>:<page-range>350&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1001/jamaoto.2021.4549</pub-id>, PMID: <pub-id pub-id-type="pmid">35266977</pub-id></citation></ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>C</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Lei</surname> <given-names>L</given-names>
</name>
<name>
<surname>Dong</surname> <given-names>X</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>W</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>Z</given-names>
</name>
<etal/>
</person-group>. <article-title>Geographic disparities in trends of thyroid cancer incidence and mortality from 1990 to 2019 and a projection to 2030 across income-classified countries and territories</article-title>. <source>J Glob Health</source>. (<year>2023</year>) <volume>13</volume>:<fpage>04108</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.7189/jogh.13.04108</pub-id>, PMID: <pub-id pub-id-type="pmid">37766638</pub-id></citation></ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rahman</surname> <given-names>ST</given-names>
</name>
<name>
<surname>Pandeya</surname> <given-names>N</given-names>
</name>
<name>
<surname>Neale</surname> <given-names>RE</given-names>
</name>
<name>
<surname>McLeod</surname> <given-names>DSA</given-names>
</name>
<name>
<surname>Bain</surname> <given-names>CJ</given-names>
</name>
<name>
<surname>Baade</surname> <given-names>PD</given-names>
</name>
<etal/>
</person-group>. <article-title>Obesity is associated with BRAF(V600E)-mutated thyroid cancer</article-title>. <source>Thyroid</source>. (<year>2020</year>) <volume>30</volume>:<page-range>1518&#x2013;27</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1089/thy.2019.0654</pub-id>, PMID: <pub-id pub-id-type="pmid">32228152</pub-id></citation></ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>B</given-names>
</name>
<name>
<surname>Han</surname> <given-names>X</given-names>
</name>
<name>
<surname>Ding</surname> <given-names>S</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y</given-names>
</name>
</person-group>. <article-title>Global, regional, and national burdens of HIV and other sexually transmitted infections in adolescents and young adults aged 10-24 years from 1990 to 2019: a trend analysis based on the Global Burden of Disease Study 2019</article-title>. <source>Lancet Child Adolesc Health</source>. (<year>2022</year>) <volume>6</volume>:<page-range>763&#x2013;76</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S2352-4642(22)00219-X</pub-id>, PMID: <pub-id pub-id-type="pmid">36108664</pub-id></citation></ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jain</surname> <given-names>S</given-names>
</name>
<name>
<surname>Agrawal</surname> <given-names>S</given-names>
</name>
<name>
<surname>Mohapatra</surname> <given-names>E</given-names>
</name>
<name>
<surname>Srinivasan</surname> <given-names>K</given-names>
</name>
</person-group>. <article-title>A novel ensemble ARIMA-LSTM approach for evaluating COVID-19 cases and future outbreak preparedness</article-title>. <source>Health Care Sci</source>. (<year>2024</year>) <volume>3</volume>:<page-range>409&#x2013;25</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/hcs2.123</pub-id>, PMID: <pub-id pub-id-type="pmid">39735282</pub-id></citation></ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schubert</surname> <given-names>C</given-names>
</name>
<name>
<surname>Seizer</surname> <given-names>L</given-names>
</name>
<name>
<surname>Chamson</surname> <given-names>E</given-names>
</name>
<name>
<surname>K&#xf6;nig</surname> <given-names>P</given-names>
</name>
<name>
<surname>Sepp</surname> <given-names>N</given-names>
</name>
<name>
<surname>Oca&#xf1;a-Peinado</surname> <given-names>FM</given-names>
</name>
<etal/>
</person-group>. <article-title>Real-life cause-effect relations between urinary IL-6 levels and specific and nonspecific symptoms in a patient with mild SLE disease activity</article-title>. <source>Front Immunol</source>. (<year>2021</year>) <volume>12</volume>:<elocation-id>718838</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fimmu.2021.718838</pub-id>, PMID: <pub-id pub-id-type="pmid">34975831</pub-id></citation></ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>G</given-names>
</name>
<name>
<surname>Kuang</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Li</surname> <given-names>F</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>The causal relationship between gut microbiota and leukemia: a two-sample Mendelian randomization study</article-title>. <source>Front Microbiol</source>. (<year>2023</year>) <volume>14</volume>:<elocation-id>1293333</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2023.1293333</pub-id>, PMID: <pub-id pub-id-type="pmid">38075916</pub-id></citation></ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>D</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>J</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>T</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Genetically predicted chilhood body mass index and lung cancer susceptibility:A two-sample Mendelian randomization study</article-title>. <source>Cancer Med</source>. (<year>2023</year>) <volume>12</volume>:<page-range>18418&#x2013;24</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/cam4.6406</pub-id>, PMID: <pub-id pub-id-type="pmid">37548289</pub-id></citation></ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>T</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>R</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Identification of diagnostic genes for both Alzheimer&#x2019;s disease and Metabolic syndrome by the machine learning algorithm</article-title>. <source>Front Immunol</source>. (<year>2022</year>) <volume>13</volume>:<elocation-id>1037318</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fimmu.2022.1037318</pub-id>, PMID: <pub-id pub-id-type="pmid">36405716</pub-id></citation></ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wen</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>C</given-names>
</name>
<name>
<surname>Xia</surname> <given-names>J</given-names>
</name>
<name>
<surname>Giri</surname> <given-names>M</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Relationship between serum iron and blood eosinophil counts in asthmatic adults: data from NHANES 2011-2018</article-title>. <source>Front Immunol</source>. (<year>2023</year>) <volume>14</volume>:<elocation-id>1201160</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fimmu.2023.1201160</pub-id>, PMID: <pub-id pub-id-type="pmid">37731511</pub-id></citation></ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wei</surname> <given-names>C</given-names>
</name>
<name>
<surname>Wei</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>J</given-names>
</name>
<name>
<surname>Tan</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Identification and verification of diagnostic biomarkers in recurrent pregnancy loss via machine learning algorithm and WGCNA</article-title>. <source>Front Immunol</source>. (<year>2023</year>) <volume>14</volume>:<elocation-id>1241816</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fimmu.2023.1241816</pub-id>, PMID: <pub-id pub-id-type="pmid">37691920</pub-id></citation></ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Talia</surname> <given-names>M</given-names>
</name>
<name>
<surname>Cesario</surname> <given-names>E</given-names>
</name>
<name>
<surname>Cirillo</surname> <given-names>F</given-names>
</name>
<name>
<surname>Scordamaglia</surname> <given-names>D</given-names>
</name>
<name>
<surname>Di Dio</surname> <given-names>M</given-names>
</name>
<name>
<surname>Zicarelli</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Cancer-associated fibroblasts (CAFs) gene signatures predict outcomes in breast and prostate tumor patients</article-title>. <source>J Transl Med</source>. (<year>2024</year>) <volume>22</volume>:<fpage>597</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12967-024-05413-2</pub-id>, PMID: <pub-id pub-id-type="pmid">38937754</pub-id></citation></ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zuo</surname> <given-names>D</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>L</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Qi</surname> <given-names>H</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Ren</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Machine learning-based models for the prediction of breast cancer recurrence risk</article-title>. <source>BMC Med Inform Decis Mak</source>. (<year>2023</year>) <volume>23</volume>:<fpage>276</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12911-023-02377-z</pub-id>, PMID: <pub-id pub-id-type="pmid">38031071</pub-id></citation></ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sathish</surname> <given-names>T</given-names>
</name>
<name>
<surname>Sunagar</surname> <given-names>P</given-names>
</name>
<name>
<surname>Singh</surname> <given-names>V</given-names>
</name>
<name>
<surname>Boopathi</surname> <given-names>S</given-names>
</name>
<name>
<surname>Sathyamurthy</surname> <given-names>R</given-names>
</name>
<name>
<surname>Al-Enizi</surname> <given-names>AM</given-names>
</name>
<etal/>
</person-group>. <article-title>Characteristics estimation of natural fibre reinforced plastic composites using deep multi-layer perceptron (MLP) technique</article-title>. <source>Chemosphere</source>. (<year>2023</year>) <volume>337</volume>:<elocation-id>139346</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.chemosphere.2023.139346</pub-id>, PMID: <pub-id pub-id-type="pmid">37379988</pub-id></citation></ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Youssef Ali Amer</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Global-local least-squares support vector machine (GLocal-LS-SVM)</article-title>. <source>PloS One</source>. (<year>2023</year>) <volume>18</volume>:<elocation-id>e0285131</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0285131</pub-id>, PMID: <pub-id pub-id-type="pmid">37104506</pub-id></citation></ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>G</given-names>
</name>
<name>
<surname>Li</surname> <given-names>C</given-names>
</name>
<name>
<surname>Yin</surname> <given-names>L</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>X</given-names>
</name>
</person-group>. <article-title>Compared between support vector machine (SVM) and deep belief network (DBN) for multi-classification of Raman spectroscopy for cervical diseases</article-title>. <source>Photodiagnosis Photodyn Ther</source>. (<year>2023</year>) <volume>42</volume>:<elocation-id>103340</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.pdpdt.2023.103340</pub-id>, PMID: <pub-id pub-id-type="pmid">36858147</pub-id></citation></ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>M</given-names>
</name>
<name>
<surname>An</surname> <given-names>ZX</given-names>
</name>
<name>
<surname>He</surname> <given-names>YL</given-names>
</name>
</person-group>. <article-title>Using Mendelian randomization to explore the causal association between gut microbiota and monalcoholic fatty liver disease</article-title>. <source>Acta Univ Med Anhui</source>. (<year>2024</year>) <volume>59</volume>:<page-range>236&#x2013;42</page-range>.</citation></ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Salis</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Sainsbury</surname> <given-names>A,I</given-names>
</name>
<name>
<surname>Keen</surname> <given-names>H</given-names>
</name>
<name>
<surname>Gallego</surname> <given-names>B</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>X</given-names>
</name>
</person-group>. <article-title>Weight loss is associated with reduced risk of knee and hip replacement: a survival analysis using Osteoarthritis Initiative data</article-title>. <source>Int J Obes</source>. (<year>2022</year>) <volume>46</volume>:<page-range>874&#x2013;84</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41366-021-01046-3</pub-id>, PMID: <pub-id pub-id-type="pmid">35017711</pub-id></citation></ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cao</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>A causal relationship between childhood obesity and risk of osteoarthritis: results from a two-sample Mendelian randomization analysis</article-title>. <source>Ann Med</source>. (<year>2022</year>) <volume>54</volume>:<page-range>1636&#x2013;45</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/07853890.2022.2085883</pub-id>, PMID: <pub-id pub-id-type="pmid">35703935</pub-id></citation></ref>
<ref id="B35">
<label>35</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname> <given-names>JY</given-names>
</name>
<name>
<surname>Labrecque</surname> <given-names>JA</given-names>
</name>
</person-group>. <article-title>From GWAS to PheWAS: the search for causality in big data</article-title>. <source>Lancet Digit Health</source>. (<year>2019</year>) <volume>1</volume>:<page-range>e101&#x2013;e3</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S2589-7500(19)30059-7</pub-id>, PMID: <pub-id pub-id-type="pmid">33323255</pub-id></citation></ref>
<ref id="B36">
<label>36</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ghasemi</surname> <given-names>A</given-names>
</name>
<name>
<surname>Zahediasl</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Normality tests for statistical analysis: a guide for non-statisticians</article-title>. <source>Int J Endocrinol Metab</source>. (<year>2012</year>) <volume>10</volume>:<page-range>486&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.5812/ijem.3505</pub-id>, PMID: <pub-id pub-id-type="pmid">23843808</pub-id></citation></ref>
<ref id="B37">
<label>37</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>X</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>H</given-names>
</name>
</person-group>. <article-title>Trends and projections of the global burden of thyroid cancer from 1990 to 2030</article-title>. <source>J Glob Health</source>. (<year>2024</year>) <volume>14</volume>:<elocation-id>4084</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.7189/jogh.14.04084</pub-id>, PMID: <pub-id pub-id-type="pmid">38751316</pub-id></citation></ref>
<ref id="B38">
<label>38</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gong</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Zhai</surname> <given-names>M</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>T</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Thyroid cancer trends in China and its comparative analysis with G20 countries: Projections for 2020&#x2013;2040</article-title>. <source>J Glob Health</source>. (<year>2024</year>) <volume>14</volume>:<fpage>04131</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.7189/jogh.14.04131</pub-id>, PMID: <pub-id pub-id-type="pmid">38873786</pub-id></citation></ref>
<ref id="B39">
<label>39</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Murray</surname> <given-names>CJ</given-names>
</name>
<name>
<surname>Lopez</surname> <given-names>AD</given-names>
</name>
<name>
<surname>Jamison</surname> <given-names>DT</given-names>
</name>
</person-group>. <article-title>The global burden of disease in 1990: summary results, sensitivity analysis and future directions</article-title>. <source>Bull World Health Organ</source>. (<year>1994</year>) <volume>72</volume>:<fpage>495</fpage>&#x2013;<lpage>509</lpage>., PMID: <pub-id pub-id-type="pmid">8062404</pub-id></citation></ref>
<ref id="B40">
<label>40</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jia</surname> <given-names>MJ</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>S</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>XN</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>F</given-names>
</name>
<name>
<surname>Li</surname> <given-names>HL</given-names>
</name>
</person-group>. <article-title>Global burden of thyroid cancer among adolescents and young adults, 1990-2021, and projections to 2050: an analysis based on the GBD 2021</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2025</year>) <volume>16</volume>:<elocation-id>1503144</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fendo.2025.1503144</pub-id>, PMID: <pub-id pub-id-type="pmid">40297175</pub-id></citation></ref>
<ref id="B41">
<label>41</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rafi</surname> <given-names>M</given-names>
</name>
<name>
<surname>Kanwal</surname> <given-names>MA</given-names>
</name>
<name>
<surname>Awais</surname> <given-names>M</given-names>
</name>
<name>
<surname>Ahmad</surname> <given-names>T</given-names>
</name>
<name>
<surname>Tayyab</surname> <given-names>M</given-names>
</name>
<name>
<surname>Naem</surname> <given-names>MS</given-names>
</name>
<etal/>
</person-group>. <article-title>Unveiling the Malignancy risk of surgically treated bethesda III thyroid nodules: A 10-year retrospective study comparing fine-needle aspiration cytology (FNAC) and histopathology</article-title>. <source>Cureus</source>. (<year>2024</year>) <volume>16</volume>:<elocation-id>e75855</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.7759/cureus.75855</pub-id>, PMID: <pub-id pub-id-type="pmid">39822453</pub-id></citation></ref>
<ref id="B42">
<label>42</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Suchta</surname> <given-names>K</given-names>
</name>
<name>
<surname>Zeber-Lubecka</surname> <given-names>N</given-names>
</name>
<name>
<surname>Grymowicz</surname> <given-names>M</given-names>
</name>
<name>
<surname>Smolarczyk</surname> <given-names>R</given-names>
</name>
<name>
<surname>Kulecka</surname> <given-names>M</given-names>
</name>
<name>
<surname>Hennig</surname> <given-names>EE</given-names>
</name>
</person-group>. <article-title>Autoimmune processes and chronic inflammation as independent risk factors for metabolic complications in women with polycystic ovary syndrome</article-title>. <source>Metabolites</source>. (<year>2025</year>) <volume>15</volume>:<elocation-id>141</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/metabo15030141</pub-id>, PMID: <pub-id pub-id-type="pmid">40137106</pub-id></citation></ref>
<ref id="B43">
<label>43</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Celik</surname> <given-names>MN</given-names>
</name>
<name>
<surname>Yesildemir</surname> <given-names>O</given-names>
</name>
</person-group>. <article-title>Endocrine disruptors in child obesity and related disorders: early critical windows of exposure</article-title>. <source>Curr Nutr Rep</source>. (<year>2025</year>) <volume>14</volume>:<fpage>14</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s13668-024-00604-1</pub-id>, PMID: <pub-id pub-id-type="pmid">39775248</pub-id></citation></ref>
<ref id="B44">
<label>44</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>L</given-names>
</name>
<name>
<surname>Weng</surname> <given-names>S</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>C</given-names>
</name>
<name>
<surname>Dang</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>Machine learning-based integration develops an immune-derived lncRNA signature for improving outcomes in colorectal cancer</article-title>. <source>Nat Commun</source>. (<year>2022</year>) <volume>13</volume>:<fpage>816</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467-022-28421-6</pub-id>, PMID: <pub-id pub-id-type="pmid">35145098</pub-id></citation></ref>
<ref id="B45">
<label>45</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>D</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>R</given-names>
</name>
<name>
<surname>Yan</surname> <given-names>K</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>Yang L.Development and validation of a real-time prediction model for acute kidney injury in hospitalized patients</article-title>. <source>Nat Commun</source>. (<year>2025</year>) <volume>16</volume>:<fpage>68</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467-024-55629-5</pub-id>, PMID: <pub-id pub-id-type="pmid">39747882</pub-id></citation></ref>
<ref id="B46">
<label>46</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marino</surname> <given-names>L</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>A</given-names>
</name>
<name>
<surname>Ni</surname> <given-names>B</given-names>
</name>
<name>
<surname>Celi</surname> <given-names>FS</given-names>
</name>
</person-group>. <article-title>Thyroid hormone action and liver disease, a complex interplay</article-title>. <source>Hepatology</source>. (<year>2025</year>) <volume>81</volume>:<page-range>651&#x2013;69</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/HEP.0000000000000551</pub-id>, PMID: <pub-id pub-id-type="pmid">37535802</pub-id></citation></ref>
</ref-list>
</back>
</article>