<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Cardiovasc. Med.</journal-id>
<journal-title>Frontiers in Cardiovascular Medicine</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Cardiovasc. Med.</abbrev-journal-title>
<issn pub-type="epub">2297-055X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fcvm.2025.1490961</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Cardiovascular Medicine</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Development and validation of a carotid plaque risk prediction model for coal miners</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes"><name><surname>Li</surname><given-names>Yi-Chun</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="author-notes" rid="an1"><sup>&#x2020;</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/3052407/overview" /><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/methodology/"/><role content-type="https://credit.niso.org/contributor-roles/software/"/><role content-type="https://credit.niso.org/contributor-roles/validation/"/><role content-type="https://credit.niso.org/contributor-roles/visualization/"/><role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author" equal-contrib="yes"><name><surname>Zhang</surname><given-names>Tie-Ru</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="author-notes" rid="an1"><sup>&#x2020;</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/3052499/overview" /><role content-type="https://credit.niso.org/contributor-roles/data-curation/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/software/"/><role content-type="https://credit.niso.org/contributor-roles/validation/"/><role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>Zhang</surname><given-names>Fan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/3052643/overview" /><role content-type="https://credit.niso.org/contributor-roles/data-curation/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/methodology/"/><role content-type="https://credit.niso.org/contributor-roles/software/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>Cui</surname><given-names>Chao-Qun</given-names></name><uri xlink:href="https://loop.frontiersin.org/people/3052406/overview" />
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref><role content-type="https://credit.niso.org/contributor-roles/data-curation/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/methodology/"/><role content-type="https://credit.niso.org/contributor-roles/software/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>Yang</surname><given-names>Yu-Tong</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/2691095/overview"/><role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/><role content-type="https://credit.niso.org/contributor-roles/data-curation/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/software/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>Hao</surname><given-names>Jian-Guang</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref><role content-type="https://credit.niso.org/contributor-roles/data-curation/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/supervision/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>Wang</surname><given-names>Jian-Ru</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref><role content-type="https://credit.niso.org/contributor-roles/data-curation/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>Wu</surname><given-names>Jiao</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref><role content-type="https://credit.niso.org/contributor-roles/data-curation/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/software/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>Gao</surname><given-names>Hai-Wang</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref><role content-type="https://credit.niso.org/contributor-roles/data-curation/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>Liu</surname><given-names>Ying-Bo</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref><role content-type="https://credit.niso.org/contributor-roles/data-curation/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author" corresp="yes"><name><surname>Luo</surname><given-names>Ming-Zhong</given-names></name>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
<xref ref-type="corresp" rid="cor1">&#x002A;</xref><role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/><role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/><role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/><role content-type="https://credit.niso.org/contributor-roles/project-administration/"/><role content-type="https://credit.niso.org/contributor-roles/resources/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author" corresp="yes"><name><surname>Lei</surname><given-names>Li-Jian</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="cor1">&#x002A;</xref><uri xlink:href="https://loop.frontiersin.org/people/2203276/overview" /><role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/><role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/><role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/><role content-type="https://credit.niso.org/contributor-roles/project-administration/"/><role content-type="https://credit.niso.org/contributor-roles/resources/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
</contrib-group>
<aff id="aff1"><label><sup>1</sup></label><institution>Department of Epidemiology, School of Public Health, Shanxi Medical University</institution>, <addr-line>Taiyuan, Shanxi</addr-line>, <country>China</country></aff>
<aff id="aff2"><label><sup>2</sup></label><institution>MOE Key Laboratory of Coal Environmental Pathogenicity and Prevention, Shanxi Medical University</institution>, <addr-line>Taiyuan, Shanxi</addr-line>, <country>China</country></aff>
<aff id="aff3"><label><sup>3</sup></label><institution>Research Centre of Environmental Pollution and Major Chronic Diseases Epidemiology, Shanxi Medical University</institution>, <addr-line>Taiyuan, Shanxi</addr-line>, <country>China</country></aff>
<aff id="aff4"><label><sup>4</sup></label><institution>Department of Occupational Diseases and Poisoning, The Second People&#x2019;s Hospital of Shanxi Province</institution>, <addr-line>Taiyuan</addr-line>, <country>China</country></aff>
<aff id="aff5"><label><sup>5</sup></label><institution>Department of Medical and Education, The Second People&#x2019;s Hospital of Shanxi Province</institution>, <addr-line>Taiyuan</addr-line>, <country>China</country></aff>
<aff id="aff6"><label><sup>6</sup></label><institution>Peking University Medical Lu&#x0027;an Hospital Health Management Center</institution>, <addr-line>Changzhi, Shanxi</addr-line>, <country>China</country></aff>
<aff id="aff7"><label><sup>7</sup></label><institution>Office of the President, The Second People&#x2019;s Hospital of Shanxi Province</institution>, <addr-line>Taiyuan</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p><bold>Edited by:</bold> Pasqualino Sirignano, Sapienza University of Rome, Italy</p></fn>
<fn fn-type="edited-by"><p><bold>Reviewed by:</bold> Panagiotis Siogkas, University of Ioannina, Greece</p>
<p>Yufeng Ye, Guangzhou Panyu Central Hospital, China</p>
<p>Gloria Cirelli, Sapienza University of Rome, Italy</p></fn>
<corresp id="cor1"><label>&#x002A;</label><bold>Correspondence:</bold> Ming-Zhong Luo <email>Lmz7344@163.com</email> Li-Jian Lei <email>wwdlijian@sxmu.edu.cn</email></corresp>
<fn fn-type="equal" id="an1"><label><sup>&#x2020;</sup></label><p>These authors have contributed equally to this work</p></fn>
</author-notes>
<pub-date pub-type="epub"><day>09</day><month>05</month><year>2025</year></pub-date>
<pub-date pub-type="collection"><year>2025</year></pub-date>
<volume>12</volume><elocation-id>1490961</elocation-id>
<history>
<date date-type="received"><day>12</day><month>09</month><year>2024</year></date>
<date date-type="accepted"><day>24</day><month>04</month><year>2025</year></date>
</history>
<permissions>
<copyright-statement>&#x00A9; 2025 Li, Zhang, Zhang, Cui, Yang, Hao, Wang, Wu, Gao, Liu, Luo and Lei.</copyright-statement>
<copyright-year>2025</copyright-year><copyright-holder>Li, Zhang, Zhang, Cui, Yang, Hao, Wang, Wu, Gao, Liu, Luo and Lei</copyright-holder><license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract><sec><title>Objective</title>
<p>Carotid plaque represents an independent risk factor for cardiovascular disease and a significant threat to human health. The aim of the study is to develop an accurate and interpretable predictive model for the early detection of carotid plaque.</p>
</sec><sec><title>Methods</title>
<p>A cross-sectional study was conducted by selecting coal miners who participated in medical examinations from October 2021 to January 2022 at a hospital in North China. The features were initially screened using extreme gradient boosting (XGBoost), random forest, and LASSO regression, and the model was subsequently constructed using logistic regression. The three models were then compared, and the optimum model was identified. Finally, a nomogram was plotted to increase its interpretability.</p>
</sec><sec><title>Results</title>
<p>The XGBoost algorithm demonstrated superior performance in feature screening, identifying the top five features as follows: age, systolic blood pressure, low-density lipoprotein cholesterol, white blood cell count, and body mass index (BMI). The area under the curve (AUC), sensitivity, and specificity of the model constructed based on the XGBoost algorithm were 0.846, 0.867, and 0.702, respectively.</p>
</sec><sec><title>Conclusions</title>
<p>It is possible to predict the presence of carotid plaque using machine learning. The model has high application value and can better predict the risk of carotid artery plaque in coal miners. Furthermore, it provides a theoretical basis for the health management of coal miners.</p>
</sec>
</abstract>
<kwd-group>
<kwd>XGBoost</kwd>
<kwd>nomogram</kwd>
<kwd>machine learning</kwd>
<kwd>coal miners</kwd>
<kwd>carotid plaque</kwd>
</kwd-group><contract-num rid="cn001">2021XM43</contract-num><contract-num rid="cn002">CEPPOF202303</contract-num><contract-num rid="cn003">BYBLD002</contract-num><contract-sponsor id="cn001">The &#x201C;Four Batch&#x201D; of Technology-Driven Medical Innovation Plan in Shanxi province, China</contract-sponsor><contract-sponsor id="cn002">Key Laboratory of Coal Environmental Pathogenicity and Prevention (Shanxi Medical University), Ministry of Education, China</contract-sponsor><contract-sponsor id="cn003">Shanxi Province Higher Education &#x201C;Billion Project&#x201D; Science and Technology Guidance Project</contract-sponsor><counts>
<fig-count count="5"/>
<table-count count="2"/><equation-count count="1"/><ref-count count="35"/><page-count count="9"/><word-count count="0"/></counts><custom-meta-wrap><custom-meta><meta-name>section-at-acceptance</meta-name><meta-value>Cardiovascular Epidemiology and Prevention</meta-value></custom-meta></custom-meta-wrap>
</article-meta>
</front>
<body><sec id="s1" sec-type="intro"><label>1</label><title>Introduction</title>
<p>Carotid plaque is an independent risk factor for stroke (<xref ref-type="bibr" rid="B1">1</xref>), coronary heart disease (<xref ref-type="bibr" rid="B2">2</xref>), and atherosclerotic cardiovascular disease (<xref ref-type="bibr" rid="B3">3</xref>). These diseases are the major causes of disability and death globally (<xref ref-type="bibr" rid="B4">4</xref>, <xref ref-type="bibr" rid="B5">5</xref>), and they pose a serious economic burden in both developed and developing countries (<xref ref-type="bibr" rid="B6">6</xref>). A study has shown that the prevalence of carotid plaque in the middle-aged and elderly population in China is 60.3&#x0025; (<xref ref-type="bibr" rid="B7">7</xref>). As the population of China continues to age and urbanize, the prevalence of cardiovascular and cerebrovascular diseases is expected to increase (<xref ref-type="bibr" rid="B8">8</xref>). In some research, occupational stress is identified as a risk factor for cardiovascular disease, with the potential for atherosclerosis to develop as a result of long-term occupational stress (<xref ref-type="bibr" rid="B9">9</xref>). China is the world&#x0027;s largest coal producer, with 95&#x0025; of its coal sourced from underground mining (<xref ref-type="bibr" rid="B10">10</xref>), which employs over six million workers (<xref ref-type="bibr" rid="B11">11</xref>). In comparison to the general population, coal miners are exposed to a number of harmful factors, including dust (<xref ref-type="bibr" rid="B12">12</xref>) and shift work (<xref ref-type="bibr" rid="B13">13</xref>). Additionally, they tend to engage in a range of adverse lifestyle habits, such as smoking (<xref ref-type="bibr" rid="B14">14</xref>) and alcohol consumption, which can increase the likelihood of developing carotid plaques. Therefore, it is crucial to implement early screening and intervention strategies for coal miners to delay the occurrence and progression of carotid plaque.
The majority of studies to date have focused on disease risk in the general population (<xref ref-type="bibr" rid="B15">15</xref>, <xref ref-type="bibr" rid="B16">16</xref>), with fewer studies investigating the prediction of disease risk in coal miners.</p>
<p>Predictive models can estimate the probability or risk of an outcome using the characteristics of an individual (<xref ref-type="bibr" rid="B17">17</xref>); a model that estimates the probability that a condition is currently present is called a diagnostic model. Diagnostic models are of crucial significance in healthcare. They reduce testing costs and enhance the accuracy, efficiency and objectivity of decision-making. They also help clinicians diagnose and treat patients more effectively, thereby improving the quality of healthcare and the patient care experience.</p>
<p>This study used extreme gradient boosting (XGBoost), random forests, and LASSO regression to filter features for predicting carotid plaque risk in coal miners. Then, logistic regression was applied to create a simple practical risk prediction model to identify at-risk individuals.</p>
</sec>
<sec id="s2"><label>2</label><title>Material and methods</title>
<sec id="s2a"><label>2.1</label><title>Data sources and subjects</title>
<p>Data were retrospectively collected from coal miners who attended physical examinations at a hospital in North China between October 2021 and January 2022. After excluding participants with incomplete data records, those younger than 18 years or older than 60 years, and those with cardiovascular disease, 2,956 participants were included in the study for the prediction model.</p>
</sec>
<sec id="s2b"><label>2.2</label><title>Ethical approval</title>
<p>All procedures were approved by the Research Ethics Committee of the Second People&#x0027;s Hospital of Shanxi Province and were conducted strictly in accordance with internationally recognized ethical standards for human research. All participants in this survey were aware of the research contents and precautions and participated voluntarily.</p>
</sec>
<sec id="s2c"><label>2.3</label><title>Potential predictors and case definition</title>
<p>A review of the pertinent literature on carotid plaque and an analysis of the accessibility of predictors led to the identification of 27 potential factors: (1) Demographic characteristics: gender, age; (2) Physical examination indicators: height (HT), weight (WT), body mass index (BMI), systolic blood pressure (SBP), diastolic blood pressure (DBP); (3) Laboratory tests: total cholesterol (TC), triglycerides (TG), high-density lipoprotein cholesterol (HDL-C), low-density lipoprotein cholesterol (LDL-C), fasting blood glucose (FBG), alanine aminotransferase (ALT), aspartate aminotransferase (AST), direct bilirubin (DBIL), total bilirubin (TBIL), alkaline phosphatase (ALP), uric acid (UA), platelet count (PLT), white blood cell count (WBC), creatinine (CRE); (4) Lifestyle habits: smoking, alcohol consumption; (5) Occupational factors: years of working experience, exposure to dust (rock dust and coal dust), exposure to hazardous gases (carbon monoxide and hydrogen sulfide); (6) Other indicators: fatty liver disease (FLD).</p>
<p>Cases were defined as participants diagnosed with carotid plaque by carotid ultrasound. The diameters and intima-media thickness (IMT) of the distal common carotid artery, the carotid bulb, and the proximal internal carotid artery were measured within 1&#x2013;1.5 cm below the level of the bifurcation of the participant&#x0027;s internal and external carotid arteries by an experienced physician to observe the presence of atherosclerotic plaque.</p>
</sec>
<sec id="s2d"><label>2.4</label><title>Data processing and predictive modelling</title>
<p>To make full use of the data and evaluate the model&#x0027;s performance, we first randomly divided the dataset into a training set (70&#x0025;) and a test set (30&#x0025;), which were used for model training and model evaluation, respectively. To ensure the robustness and generalizability of our model, all the data in the training set were utilized in ten-fold cross-validation for model training.</p>
<p>The statistical analyses in this study were conducted using IBM SPSS 26.0. Normally distributed data were expressed as &#x201C;x&#x0304;&#x2009;&#x00B1;&#x2009;s&#x201D;, and t-tests were employed for comparisons between groups. Data that were not normally distributed were expressed as &#x201C;[M (P<sub>25</sub>, P<sub>75</sub>)]&#x201D;, and rank-sum tests were employed for comparisons between groups. The data for categorical variables were expressed as percentages, and the Pearson <italic>&#x03C7;</italic><sup>2</sup> test was employed for comparisons between groups. The level of the test was set at <italic>&#x03B1;</italic>&#x2009;&#x003D;&#x2009;0.05 in this paper. R (version 4.2.3) was employed for feature screening, model construction, the generation of nomograms, and the assessment of the effects.</p>
<p>XGBoost, random forest, and LASSO regression were each used to select features from the training set; the selected features served as the input variables, and the presence of carotid artery plaque as the output variable, to construct a logistic regression model. Considering the potential multicollinearity among different variables, which may lead to model instability, the study evaluated the features selected by the three machine learning algorithms based on correlation statistical charts as part of model selection. The performance of the three models was compared by the area under the ROC curve (AUC), net reclassification index (NRI), and integrated discrimination improvement (IDI), and the model with the best performance was ultimately selected. Subsequently, the optimal model was used to construct a nomogram, which was evaluated using decision curve analysis (DCA) and clinical impact curves (CIC).</p>
</sec>
</sec>
<sec id="s3" sec-type="results"><label>3</label><title>Results</title>
<sec id="s3a"><label>3.1</label><title>Basic characteristics of the study object</title>
<p>A total of 2,956 individuals were included in this study, with a prevalence of carotid plaque of 10.52&#x0025;. Participants with carotid plaque were older and more likely to be men than those without carotid plaque. They also had higher BMI, systolic blood pressure, diastolic blood pressure, total cholesterol, triglycerides, LDL cholesterol, fasting blood glucose, alkaline phosphatase, white blood cell count, creatinine, years of working experience, a higher prevalence of fatty liver disease, and higher rates of alcohol consumption and smoking. The statistical analysis revealed that there were significant differences in these predictors between participants with and without carotid plaque (<xref ref-type="table" rid="T1">Table&#x00A0;1</xref>). Following the random allocation of the data, a total of 2,069 individuals were included in the training set, with a prevalence of carotid plaque of 10.54&#x0025; (<xref ref-type="sec" rid="s11">Supplementary Table S1</xref>), and a total of 887 individuals were included in the test set, with a prevalence of carotid plaque of 10.48&#x0025; (<xref ref-type="sec" rid="s11">Supplementary Table S2</xref>).</p>
<table-wrap id="T1" position="float"><label>Table 1</label>
<caption><p>Basic characteristics of the study population.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left" rowspan="2">Characteristic</th>
<th valign="top" align="center" colspan="2">Carotid plaque</th>
<th valign="top" align="center" rowspan="2"><italic>P</italic> value</th>
</tr>
<tr>
<th valign="top" align="center">Yes (<italic>n</italic>&#x2009;&#x003D;&#x2009;311)</th>
<th valign="top" align="center">No (<italic>n</italic>&#x2009;&#x003D;&#x2009;2,645)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" colspan="3">Sex, <italic>n</italic> (&#x0025;)</td>
<td valign="top" align="center" colspan="1">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Female</td>
<td valign="top" align="center">34 (10.9&#x0025;)</td>
<td valign="top" align="center">744 (28.1&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">Male</td>
<td valign="top" align="center">277 (89.1&#x0025;)</td>
<td valign="top" align="center">1,901 (71.9&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">Age (years), (mean&#x2009;&#x00B1;&#x2009;SD)</td>
<td valign="top" align="center">47.5&#x2009;&#x00B1;&#x2009;6.53</td>
<td valign="top" align="center">38.6&#x2009;&#x00B1;&#x2009;7.73</td>
<td valign="top" align="center">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">HT (cm), median (IQR)</td>
<td valign="top" align="center">169.50 (164.90&#x2013;174.00)</td>
<td valign="top" align="center">170.10 (164.40&#x2013;175.10)</td>
<td valign="top" align="center">0.774</td>
</tr>
<tr>
<td valign="top" align="left">WT (kg), median (IQR)</td>
<td valign="top" align="center">76.00 (68.20&#x2013;83.00)</td>
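<!-- NOTE(review): the median 17.70 below lies outside its own IQR (64.80 to 82.40); likely a typographical error. Verify against the source data before publication. -->
<td valign="top" align="center">17.70 (64.80&#x2013;82.40)</td>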
<td valign="top" align="center">0.004</td>
</tr>
<tr>
<td valign="top" align="left">BMI (kg/m<sup>2</sup>), median (IQR)</td>
<td valign="top" align="center">26.34 (24.41&#x2013;28.36)</td>
<td valign="top" align="center">25.52 (23.21&#x2013;27.82)</td>
<td valign="top" align="center">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">SBP (mmHg), mean (SD)</td>
<td valign="top" align="center">143.00 (19.10)</td>
<td valign="top" align="center">132.00 (16.60)</td>
<td valign="top" align="center">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">DBP (mmHg), mean (SD)</td>
<td valign="top" align="center">86.00 (13.40)</td>
<td valign="top" align="center">78.70 (11.70)</td>
<td valign="top" align="center">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">TC (mmol/L), median (IQR)</td>
<td valign="top" align="center">4.71 (4.15&#x2013;5.27)</td>
<td valign="top" align="center">4.37 (3.85&#x2013;4.92)</td>
<td valign="top" align="center">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">TG (mmol/L), mean (SD)</td>
<td valign="top" align="center">1.96 (1.33)</td>
<td valign="top" align="center">1.74 (1.22)</td>
<td valign="top" align="center">0.006</td>
</tr>
<tr>
<td valign="top" align="left">HDL-C (mmol/L), mean (SD)</td>
<td valign="top" align="center">1.20 (0.31)</td>
<td valign="top" align="center">1.23 (0.30)</td>
<td valign="top" align="center">0.077</td>
</tr>
<tr>
<td valign="top" align="left">LDL-C (mmol/L), median (IQR)</td>
<td valign="top" align="center">3.02 (2.60&#x2013;3.56)</td>
<td valign="top" align="center">2.73 (2.25&#x2013;3.23)</td>
<td valign="top" align="center">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">FBG (mmol/L), mean (SD)</td>
<td valign="top" align="center">5.86 (1.56)</td>
<td valign="top" align="center">5.41 (1.07)</td>
<td valign="top" align="center">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">ALT (U/L), mean (SD)</td>
<td valign="top" align="center">26.80 (16.80)</td>
<td valign="top" align="center">25.8 (19.4)</td>
<td valign="top" align="center">0.324</td>
</tr>
<tr>
<td valign="top" align="left">AST (U/L), mean (SD)</td>
<td valign="top" align="center">22.20 (9.78)</td>
<td valign="top" align="center">20.7 (9.25)</td>
<td valign="top" align="center">0.013</td>
</tr>
<tr>
<td valign="top" align="left">DBIL (&#x00B5;mol/L), mean (SD)</td>
<td valign="top" align="center">5.06 (1.80)</td>
<td valign="top" align="center">5.09 (1.96)</td>
<td valign="top" align="center">0.812</td>
</tr>
<tr>
<td valign="top" align="left">TBIL (&#x00B5;mol/L), mean (SD)</td>
<td valign="top" align="center">12.50 (5.51)</td>
<td valign="top" align="center">12.60 (6.16)</td>
<td valign="top" align="center">0.626</td>
</tr>
<tr>
<td valign="top" align="left">ALP (U/L), mean (SD)</td>
<td valign="top" align="center">87.90 (23.10)</td>
<td valign="top" align="center">81.50 (22.50)</td>
<td valign="top" align="center">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">UA (&#x00B5;mol/L), median (IQR)</td>
<td valign="top" align="center">324.00 (267.00&#x2013;385.00)</td>
<td valign="top" align="center">314.00 (259.00&#x2013;378.00)</td>
<td valign="top" align="center">0.208</td>
</tr>
<tr>
<td valign="top" align="left">PLT (10<sup>9</sup>/L), median (IQR)</td>
<td valign="top" align="center">242.00 (210.00&#x2013;288.00)</td>
<td valign="top" align="center">254.00 (216.00&#x2013;296.00)</td>
<td valign="top" align="center">0.046</td>
</tr>
<tr>
<td valign="top" align="left">WBC (10<sup>9</sup>/L), mean (SD)</td>
<td valign="top" align="center">7.88 (2.06)</td>
<td valign="top" align="center">7.36 (1.96)</td>
<td valign="top" align="center">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">CRE (&#x00B5;mol/L), mean (SD)</td>
<td valign="top" align="center">75.00 (11.60)</td>
<td valign="top" align="center">72.00 (14.20)</td>
<td valign="top" align="center">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3">FLD, <italic>n</italic> (&#x0025;)</td>
<td valign="top" align="center" colspan="1">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Yes</td>
<td valign="top" align="center">146 (46.9&#x0025;)</td>
<td valign="top" align="center">888 (33.6&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">No</td>
<td valign="top" align="center">165 (53.1&#x0025;)</td>
<td valign="top" align="center">1,757 (66.4&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Years of working (years), <italic>n</italic> (&#x0025;)</td>
<td valign="top" align="center" colspan="1">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">1&#x2013;10</td>
<td valign="top" align="center">23 (7.4&#x0025;)</td>
<td valign="top" align="center">874 (33.0&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">11&#x2013;20</td>
<td valign="top" align="center">120 (38.6&#x0025;)</td>
<td valign="top" align="center">1,217 (46.0&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2265;21</td>
<td valign="top" align="center">168 (54.0&#x0025;)</td>
<td valign="top" align="center">554 (20.9&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Dust exposure, <italic>n</italic> (&#x0025;)</td>
<td valign="top" align="center" colspan="1">0.471</td>
</tr>
<tr>
<td valign="top" align="left">Yes</td>
<td valign="top" align="center">170 (54.7&#x0025;)</td>
<td valign="top" align="center">1,384 (52.3&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">No</td>
<td valign="top" align="center">141 (45.3&#x0025;)</td>
<td valign="top" align="center">1,261 (47.7&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Harmful gas exposure, <italic>n</italic> (&#x0025;)</td>
<td valign="top" align="center" colspan="1">0.589</td>
</tr>
<tr>
<td valign="top" align="left">Yes</td>
<td valign="top" align="center">86 (27.7&#x0025;)</td>
<td valign="top" align="center">689 (26.0&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">No</td>
<td valign="top" align="center">225 (72.3&#x0025;)</td>
<td valign="top" align="center">1,956 (74.0&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Alcohol drinking, <italic>n</italic> (&#x0025;)</td>
<td valign="top" align="center" colspan="1">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Yes</td>
<td valign="top" align="center">132 (42.4&#x0025;)</td>
<td valign="top" align="center">792 (29.9&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">No</td>
<td valign="top" align="center">179 (57.6&#x0025;)</td>
<td valign="top" align="center">1,853 (70.1&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Smoke, <italic>n</italic> (&#x0025;)</td>
<td valign="top" align="center" colspan="1">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Yes</td>
<td valign="top" align="center">185 (59.5&#x0025;)</td>
<td valign="top" align="center">978 (37.0&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">No</td>
<td valign="top" align="center">126 (40.5&#x0025;)</td>
<td valign="top" align="center">1,667 (63.0&#x0025;)</td>
<td valign="top" align="center"/>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="table-fn1"><p>HT, height; WT, weight; SBP, systolic blood pressure; DBP, diastolic blood pressure; TC, total cholesterol; TG, triglyceride; HDL-C, high-density lipoprotein cholesterol; LDL-C, low-density lipoprotein cholesterol; FBG, fasting blood glucose; ALT, alanine transaminase; AST, aspartate aminotransferase; DBIL, direct bilirubin; TBIL, total bilirubin; ALP, alkaline phosphatase; UA, uric acid; PLT, blood platelet count; WBC, white blood cell count; CRE, creatinine; FLD, fatty liver disease; Dust exposure, exposure to rock dust and coal dust; Harmful gas exposure, exposure to carbon monoxide and sulfur dioxide.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3b"><label>3.2</label><title>Screening of features</title>
<p>The correlation statistics chart in the training set demonstrates a robust correlation between the selected features (<xref ref-type="sec" rid="s11">Supplementary Figure S1</xref>). Consequently, three machine learning algorithms were selected to filter the features and subsequently construct the prediction model.</p>
<p>In the XGBoost algorithm, the hyperparameters of the model are selected through cross-validation and random search. The optimal number of iterations of the model is obtained by monitoring the number of iterations of the model using the test data, thereby preventing overfitting (<xref ref-type="sec" rid="s11">Supplementary Figure S2</xref>). The optimal number of iterations and the optimal hyperparameters of the model were then incorporated into the model. The relative importance of the features was determined by training the model on the training set. Features with the highest feature importance were extracted and plotted on a bar graph (<xref ref-type="sec" rid="s11">Supplementary Figure S3</xref>). The five most important features were selected for the next step of model construction, and the resulting prediction model was named the &#x201C;XGBoost model&#x201D;.</p>
<p>In the random forest model, the minimum mean squared error and the Gini coefficient are employed as the pivotal hyperparameters in the training set to filter the features. The relative importance of the features is then plotted (only the top ten features are plotted, <xref ref-type="sec" rid="s11">Supplementary Figure S4</xref>). Subsequently, the intersection of the top ten features is taken as the input variable for logistic regression analysis, and the constructed prediction model is designated as the &#x201C;RF model&#x201D;.</p>
<p>Finally, LASSO regression was employed to identify the most pertinent features. In the LASSO regression model, the value of <italic>&#x03BB;</italic> was selected through cross-validation, and the largest penalty parameter <italic>&#x03BB;</italic> whose mean squared error lay within one standard error of the minimum was ultimately selected (<xref ref-type="sec" rid="s11">Supplementary Figure S5</xref>). A total of five meaningful variables were obtained under this <italic>&#x03BB;</italic> for the subsequent model construction, and the constructed predictive model was designated as the &#x201C;LASSO model&#x201D;.</p>
</sec>
<sec id="s3c"><label>3.3</label><title>Construction and evaluation of the model</title>
<p>Logistic regression models were constructed using features selected by XGBoost, Random Forest and LASSO regression, respectively. The data from the training and test sets were incorporated into the three models to generate their respective ROC curves (<xref ref-type="fig" rid="F1">Figure&#x00A0;1</xref>). The AUCs of the three models in the training set are 0.846, 0.846 and 0.852, respectively. The AUCs of the three models in the test set are 0.817, 0.815 and 0.817, respectively. The AUCs of the &#x201C;LASSO model&#x201D; in the training and test sets are equal to or higher than those of the other models, although the differences are relatively minor.</p>
<fig id="F1" position="float"><label>Figure 1</label>
<caption><p>Receiver operating characteristic (ROC) curves for the three models in the training <bold>(A)</bold> and test <bold>(B)</bold> sets.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fcvm-12-1490961-g001.tif"/>
</fig>
<p>The accuracy of the three models in the training and test sets was evaluated by the net reclassification index (NRI) and the integrated discrimination improvement index (IDI) (<xref ref-type="table" rid="T2">Table&#x00A0;2</xref>). It can be seen that the accuracy of the &#x201C;XGBoost model&#x201D; is slightly better than that of the other models. There were strong correlations among the features of the &#x201C;RF model&#x201D; and the &#x201C;LASSO model&#x201D;, including between systolic blood pressure (SBP) and diastolic blood pressure (DBP) and between total cholesterol (TC) and low-density lipoprotein cholesterol (LDL-C) (<xref ref-type="sec" rid="s11">Supplementary Figure S1</xref>). The inclusion of variables with strong correlations in a predictive model can lead to an increase in the variance of parameter estimates, which in turn reduces predictive accuracy. In severe cases, anomalies may occur in which the predictive model does not reflect the relationship between the input and output variables, but rather their joint influence on the output variables. 
Therefore, the &#x201C;XGBoost model&#x201D; is chosen as the final model in this study, and the formula of the model is shown below:<disp-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="UDM1"><mml:mi>P</mml:mi><mml:mo>=</mml:mo><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mrow><mml:msup><mml:mi>e</mml:mi><mml:mrow><mml:mo>&#x2212;</mml:mo><mml:mn>13.5554</mml:mn><mml:mo>+</mml:mo><mml:mn>0.1544</mml:mn><mml:mo>&#x00D7;</mml:mo><mml:mrow><mml:mi mathvariant="normal">Age</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mn>0.0349</mml:mn><mml:mo>&#x00D7;</mml:mo><mml:mrow><mml:mi mathvariant="normal">DBP</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mn>0.3557</mml:mn><mml:mo>&#x00D7;</mml:mo><mml:mrow><mml:mi mathvariant="normal">HDL-C</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mn>0.0754</mml:mn><mml:mo>&#x00D7;</mml:mo><mml:mrow><mml:mi mathvariant="normal">WBC</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mn>0.0092</mml:mn><mml:mo>&#x00D7;</mml:mo><mml:mrow><mml:mi mathvariant="normal">BMI</mml:mi></mml:mrow></mml:mrow></mml:msup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>+</mml:mo><mml:msup><mml:mi>e</mml:mi><mml:mrow><mml:mo>&#x2212;</mml:mo><mml:mn>13.5554</mml:mn><mml:mo>+</mml:mo><mml:mn>0.1544</mml:mn><mml:mo>&#x00D7;</mml:mo><mml:mrow><mml:mi mathvariant="normal">Age</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mn>0.0349</mml:mn><mml:mo>&#x00D7;</mml:mo><mml:mrow><mml:mi mathvariant="normal">DBP</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mn>0.3557</mml:mn><mml:mo>&#x00D7;</mml:mo><mml:mrow><mml:mi mathvariant="normal">HDL-C</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mn>0.0754</mml:mn><mml:mo>&#x00D7;</mml:mo><mml:mrow><mml:mi mathvariant="normal">WBC</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mn>0.0092</mml:mn><mml:mo>&#x00D7;</mml:mo><mml:mrow><mml:mi mathvariant="normal">BMI</mml:mi></mml:mrow></mml:mrow></mml:msup></mml:mrow></mml:mfrac></mml:mrow></mml:mstyle></mml:math></disp-formula></p>
<table-wrap id="T2" position="float"><label>Table 2</label>
<caption><p>Assessment of the accuracy of the models, as measured by the net reclassification index (NRI) and the integrated discrimination improvement index (IDI).</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Comparison model</th>
<th valign="top" align="center">NRI</th>
<th valign="top" align="center"><italic>P</italic> value</th>
<th valign="top" align="center">IDI</th>
<th valign="top" align="center"><italic>P</italic> value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" colspan="5">Training set</td>
</tr>
<tr>
<td valign="top" align="left">XGB model vs. RF model</td>
<td valign="top" align="center">&#x2212;0.001</td>
<td valign="top" align="center">0.939</td>
<td valign="top" align="center">0.027</td>
<td valign="top" align="center">0.211</td>
</tr>
<tr>
<td valign="top" align="left">XGB model vs. LASSO model</td>
<td valign="top" align="center">0.004</td>
<td valign="top" align="center">0.803</td>
<td valign="top" align="center">0.001</td>
<td valign="top" align="center">0.948</td>
</tr>
<tr>
<td valign="top" align="left">RF model vs. LASSO model</td>
<td valign="top" align="center">0.006</td>
<td valign="top" align="center">0.752</td>
<td valign="top" align="center">&#x2212;0.026</td>
<td valign="top" align="center">0.461</td>
</tr>
<tr>
<td valign="top" align="left" colspan="5">Test set</td>
</tr>
<tr>
<td valign="top" align="left">XGB model vs. RF model</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">0.015</td>
<td valign="top" align="center">0.599</td>
</tr>
<tr>
<td valign="top" align="left">XGB model vs. LASSO model</td>
<td valign="top" align="center">0.021</td>
<td valign="top" align="center">0.461</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">RF model vs. LASSO model</td>
<td valign="top" align="center">0.021</td>
<td valign="top" align="center">0.461</td>
<td valign="top" align="center">0.041</td>
<td valign="top" align="center">0.595</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>A forest plot was constructed based on the characteristics of the &#x201C;XGBoost model&#x201D; (<xref ref-type="fig" rid="F2">Figure&#x00A0;2</xref>). It was found that age, diastolic blood pressure (DBP), low-density lipoprotein cholesterol (LDL-C), and white blood cell count (WBC) were the risk factors for carotid artery plaques among coal miners, with odds ratios (ORs) greater than 1 and statistically significant differences.</p>
<fig id="F2" position="float"><label>Figure 2</label>
<caption><p>Forest plot based on the features of the &#x201C;XGBoost model&#x201D;.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fcvm-12-1490961-g002.tif"/>
</fig>
</sec>
<sec id="s3d"><label>3.4</label><title>Visualization of the prediction model and evaluation of its effectiveness</title>
<p>A nomogram was constructed using the features from the XGBoost model to assess the risk of carotid plaque in miners (<xref ref-type="fig" rid="F3">Figure&#x00A0;3A</xref>). Using the first sample in the training set as an example, a nomogram was created to locate the risk score for age (<xref ref-type="fig" rid="F3">Figure&#x00A0;3B</xref>). A straight line was drawn vertically on the &#x201C;scores&#x201D; axis to determine how many scores correlate with the risk for age. This process is repeated for each trait, with the sum placed on the &#x201C;total points&#x201D; axis. Finally, a straight line is drawn vertically down to give the risk of carotid plaque in miners.</p>
<fig id="F3" position="float"><label>Figure 3</label>
<caption><p>Nomogram for predicting carotid artery plaque in miners. The blue areas in the plots indicate the distribution of variables in each feature. <bold>(A)</bold> Nomogram constructed based on the data in the training set; <bold>(B)</bold> Case nomogram plotted using the first sample in the training set as an example.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fcvm-12-1490961-g003.tif"/>
</fig>
<p>In parallel, the decision curve analysis (DCA) and clinical impact curve (CIC) of the nomogram were plotted on the training and test sets. The prevalence of carotid plaque in miners was found to be approximately 13.06&#x0025; in the previous study, thus serving as the baseline prevalence of carotid plaque in miners to plot the DCA and CIC. The analysis of the decision curves revealed that the threshold range of the nomogram in the training set was 0.02&#x2013;0.40, with the highest net gain of 0.88 (<xref ref-type="fig" rid="F4">Figure&#x00A0;4A</xref>). In the test set, the threshold range was 0.03&#x2013;0.42, with the highest net gain of 0.82 (<xref ref-type="fig" rid="F4">Figure&#x00A0;4B</xref>). The results of the DCA were used to plot clinical impact curves, which were employed to assess the clinical utility of the nomogram. The results of the clinical impact curves demonstrated that the predicted probabilities were in good agreement with the actual probabilities (<xref ref-type="fig" rid="F5">Figure&#x00A0;5A</xref>), and similar results were obtained in the test set (<xref ref-type="fig" rid="F5">Figure&#x00A0;5B</xref>).</p>
<fig id="F4" position="float"><label>Figure 4</label>
<caption><p>Decision curve analysis of the nomogram in the training set <bold>(A)</bold> and the test set <bold>(B)</bold>. The horizontal coordinates represent the probability thresholds. The line labeled &#x201C;None&#x201D; indicates the net clinical gain curve if no patients receive intervention. The line labeled &#x201C;All&#x201D; is the net clinical gain curve if all patients receive intervention. The red line represents the net benefit curve for &#x201C;treating&#x201D; patients within each prediction threshold in the training (or test) set. The bottom horizontal line represents the loss: benefit ratio, which represents the proportion of loss and benefit at different probability thresholds.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fcvm-12-1490961-g004.tif"/>
</fig>
<fig id="F5" position="float"><label>Figure 5</label>
<caption><p>Clinical impact curve analysis of the nomogram in the training set <bold>(A)</bold> and test set <bold>(B)</bold>. The horizontal coordinates represent the probability thresholds, while the vertical coordinates indicate the number of individuals. The red line illustrates the number of individuals predicted by the model to be at high risk at different probability thresholds, while the blue line depicts the number of individuals predicted to be at high risk who actually experienced an outcome event at different probability thresholds. The bottom horizontal line represents the loss: gain ratio, which indicates the proportion of losses and gains at different probability thresholds.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fcvm-12-1490961-g005.tif"/>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion"><label>4</label><title>Discussion</title>
<p>In this study, a predictive model was developed to predict the risk of carotid plaque in coal miners. Three machine learning algorithms were employed to filter the features, and based on the filtered features, a predictive model was constructed using logistic regression. Following the comparison of the three models, the XGBoost model was identified as the most effective, with an AUC, sensitivity and specificity of 0.846, 0.867 and 0.702, respectively. This may be attributed to the XGBoost approach, which combines the prediction results of multiple weak learners (decision trees) to construct a more effective model, ultimately improving overall performance. Furthermore, XGBoost employs early stopping to prevent overfitting, thereby enhancing its generalizability. Finally, a nomogram has been constructed based on the features of the &#x201C;XGBoost model&#x201D;, facilitating the prediction of the risk probability for individual samples.</p>
<p>In comparison to other studies, our research team developed a carotid plaque risk prediction model that applies to coal miners. This model included a greater number of characteristics (<xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B19">19</xref>), such as years of work experience, dust exposure, exposure to hazardous gases, and lifestyle habits. All of these characteristics are relevant to miners, and although they were not included in the final prediction model, the differences between healthy individuals and patients with carotid plaques were statistically significant for several of them (years of working, alcohol drinking and smoking). This suggests that these characteristics may provide food for thought for future studies. Xie et al. identified a significant association between air pollution and carotid plaque using a Cox proportional hazards model (<xref ref-type="bibr" rid="B12">12</xref>), whereas other studies did not include this feature. Coal miners are often exposed to dust and to hazardous gases such as carbon monoxide and hydrogen sulphide. Sugiura et al. employed multivariate logistic regression to ascertain an association between unhealthy lifestyle habits, such as habitual smoking, and atherosclerosis (<xref ref-type="bibr" rid="B14">14</xref>); other studies did not adjust for lifestyle characteristics.</p>
<p>The predicted probabilities of the three prediction models exhibited minimal discrepancy (the difference between the predictions was not statistically significant). We identified the features that appeared twice in the three models as the most crucial features, which were age, systolic blood pressure, diastolic blood pressure, total cholesterol and low-density lipoprotein cholesterol. Among these, age, as the most crucial feature, demonstrated a robust correlation in all three models, which is consistent with previous findings (<xref ref-type="bibr" rid="B20">20</xref>). Hypertension has been demonstrated to elevate the risk of carotid plaque formation, a finding consistent with our own observations (<xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B22">22</xref>). However, a study conducted in a middle-aged and elderly population indicated that systolic and diastolic blood pressure exert distinct effects on carotid plaque, with one being a risk factor for plaque development and the other a protective factor (<xref ref-type="bibr" rid="B23">23</xref>). This is contrary to the previously held view that systolic blood pressure is a risk factor for carotid plaque formation. This discrepancy may be attributed to the fact that systolic blood pressure tends to increase with age (<xref ref-type="bibr" rid="B24">24</xref>), while diastolic blood pressure tends to decrease (<xref ref-type="bibr" rid="B25">25</xref>), which is considered a protective factor. In contrast, the present study&#x0027;s main population consisted of miners undergoing a physical examination, who were considerably younger and in better physical condition. The relationship between diastolic blood pressure and carotid plaque remains unknown. Our findings may provide insight into this relationship. 
Additionally, our study found that elevated blood lipids (e.g., total cholesterol and low-density lipoprotein cholesterol) were associated with the prevalence of carotid plaque, consistent with previous studies (<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B27">27</xref>). Furthermore, we included BMI and white blood cell count (WBC) as predictors in the XGBoost model. Elevated BMI is an important risk factor for carotid plaque formation, as it can increase peripheral vascular resistance, which in turn promotes plaque formation (<xref ref-type="bibr" rid="B28">28</xref>, <xref ref-type="bibr" rid="B29">29</xref>). One study has shown that the arteries of obese individuals begin to harden during adolescence (<xref ref-type="bibr" rid="B30">30</xref>), which emphasizes the importance of maintaining a normal BMI. A number of epidemiological studies have demonstrated a correlation between inflammatory biomarkers (e.g., white blood cell count) and the formation of carotid plaques (<xref ref-type="bibr" rid="B31">31</xref>, <xref ref-type="bibr" rid="B32">32</xref>). This is consistent with our findings. Furthermore, inflammation has been identified as a risk factor for carotid plaque even in individuals with a normal weight and a healthy metabolic profile (<xref ref-type="bibr" rid="B33">33</xref>).</p>
<p>In this study, we constructed a nomogram for the prediction of carotid plaque risk in miners based on the features identified by the &#x201C;XGBoost model&#x201D;. We then introduced the decision curve analysis (DCA) and the clinical impact curve (CIC) to evaluate the performance of the nomogram. The CIC is the weighted average of the absolute mean difference between the observed probability and the predicted probability. It can be used to quantitatively evaluate the results of binary classification and thus provide a more comprehensive evaluation of the effect of the nomogram (<xref ref-type="bibr" rid="B34">34</xref>).</p>
<p>This study is subject to several limitations. Firstly, the data used to train the model in this study was derived from the physical examination of miners, which is cross-sectional in nature and therefore unable to demonstrate a causal relationship between traits and diseases. Secondly, the features encompassed in this study remain insufficiently comprehensive. For instance, prior studies have demonstrated that night shift work is correlated with an elevated risk of carotid plaque (<xref ref-type="bibr" rid="B35">35</xref>), and night shift work is highly prevalent among miners. Night shift work is likely to have a direct bearing on miners&#x0027; health; the specific occupations of miners, such as coal miners, electricians, and ventilation workers, are associated with exposure to different levels of harmful gases and dust, which may seriously affect their health; therefore, failure to consider these factors may lead to biased research results. Thirdly, the research population chosen in this study pertains specifically to coal miners in a particular area, which might have an impact on the generalization of the results. The fact that the working conditions and living environments of coal miners in this area could differ from those in other regions or workers with diverse occupational backgrounds constrains the universality and generalizability of the research findings. Fourth, the dataset used in this study exhibits a significant class imbalance, with a much lower number of positive cases compared to negative cases. While this imbalance reflected real-world clinical scenarios and ensured the model&#x0027;s robustness, it may also pose challenges for model training and performance evaluation. 
Future studies could contemplate including night shift work as an independent variable and conducting research among coal miners in various regions, with distinct working conditions and living habits, to enhance the diversity of the sample and the representativeness of the research results. Additionally, future work may explore data balancing methods to further optimize model performance.</p>
</sec>
<sec id="s5" sec-type="conclusions"><label>5</label><title>Conclusions</title>
<p>In this study, we employed three machine learning methods to screen for features and constructed a predictive model for carotid plaque risk in coal miners using logistic regression. The XGBoost algorithm demonstrated the most effective performance in the screening of features, with an AUC, sensitivity, and specificity of 0.846, 0.867, and 0.702, respectively. This method contributes to the personalized risk assessment of carotid plaque in coal miners and has the potential to enhance the cost-effectiveness of carotid ultrasound testing.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability"><title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="sec" rid="s11">Supplementary Material</xref>, further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec id="s7" sec-type="ethics-statement"><title>Ethics statement</title>
<p>The studies involving humans were approved by the Research Ethics Committee of the Second People&#x0027;s Hospital of Shanxi Province. The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p>
</sec>
<sec id="s8" sec-type="author-contributions"><title>Author contributions</title>
<p>Y-CL: Investigation, Methodology, Software, Validation, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. T-RZ: Data curation, Investigation, Software, Validation, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. FZ: Data curation, Investigation, Methodology, Software, Writing &#x2013; review &#x0026; editing. C-QC: Data curation, Investigation, Methodology, Software, Writing &#x2013; review &#x0026; editing. Y-TY: Conceptualization, Data curation, Investigation, Software, Writing &#x2013; review &#x0026; editing. J-GH: Data curation, Investigation, Supervision, Writing &#x2013; review &#x0026; editing. J-RW: Data curation, Investigation, Writing &#x2013; review &#x0026; editing. JW: Data curation, Investigation, Software, Writing &#x2013; review &#x0026; editing. H-WG: Data curation, Investigation, Writing &#x2013; review &#x0026; editing. Y-BL: Data curation, Investigation, Writing &#x2013; review &#x0026; editing. M-ZL: Conceptualization, Formal analysis, Funding acquisition, Project administration, Resources, Writing &#x2013; review &#x0026; editing. L-JL: Conceptualization, Formal analysis, Funding acquisition, Project administration, Resources, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec id="s9" sec-type="funding-information"><title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This work was supported by the &#x201C;Four Batch&#x201D; of Technology-Driven Medical Innovation Plan in Shanxi province, China (2021XM43); the Open Fund from the Key Laboratory of Coal Environmental Pathogenicity and Prevention (Shanxi Medical University), Ministry of Education, China (CEPPOF202303); and the Shanxi Province Higher Education &#x201C;Billion Project&#x201D; Science and Technology Guidance Project (BYBLD002).</p>
</sec>
<ack><title>Acknowledgments</title>
<p>We sincerely thank all study participants for providing information. In addition, we thank all the authors participating in this project for their efforts.</p>
</ack>
<sec id="s10" sec-type="COI-statement"><title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s12" sec-type="disclaimer"><title>Publisher&#x0027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material"><title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fcvm.2025.1490961/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fcvm.2025.1490961/full&#x0023;supplementary-material</ext-link></p>
<supplementary-material id="SD1" content-type="local-data">
<media mimetype="application" mime-subtype="pdf" xlink:href="Datasheet1.pdf"/></supplementary-material>
</sec>
<ref-list><title>References</title>
<ref id="B1"><label>1.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Saba</surname><given-names>L</given-names></name><name><surname>Cau</surname><given-names>R</given-names></name><name><surname>Murgia</surname><given-names>A</given-names></name><name><surname>Nicolaides</surname><given-names>AN</given-names></name><name><surname>Wintermark</surname><given-names>M</given-names></name><name><surname>Castillo</surname><given-names>M</given-names></name><etal/></person-group> <article-title>Carotid plaque-RADS: a novel stroke risk classification system</article-title>. <source>JACC Cardiovasc Imaging</source>. (<year>2024</year>) <volume>17</volume>:<fpage>62</fpage>&#x2013;<lpage>75</lpage>. <pub-id pub-id-type="doi">10.1016/j.jcmg.2023.09.005</pub-id><pub-id pub-id-type="pmid">37823860</pub-id></citation></ref>
<ref id="B2"><label>2.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bos</surname><given-names>D</given-names></name><name><surname>Arshi</surname><given-names>B</given-names></name><name><surname>Van Den Bouwhuijsen</surname><given-names>QJA</given-names></name><name><surname>Ikram</surname><given-names>MK</given-names></name><name><surname>Selwaness</surname><given-names>M</given-names></name><name><surname>Vernooij</surname><given-names>MW</given-names></name><etal/></person-group> <article-title>Atherosclerotic carotid plaque composition and incident stroke and coronary events</article-title>. <source>J Am Coll Cardiol</source>. (<year>2021</year>) <volume>77</volume>:<fpage>1426</fpage>&#x2013;<lpage>35</lpage>. <pub-id pub-id-type="doi">10.1016/j.jacc.2021.01.038</pub-id><pub-id pub-id-type="pmid">33736825</pub-id></citation></ref>
<ref id="B3"><label>3.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname><given-names>XQ</given-names></name><name><surname>Hatsukami</surname><given-names>TS</given-names></name></person-group>. <article-title>Risk factors for development of carotid plaque components</article-title>. <source>JACC Cardiovasc Imaging</source>. (<year>2018</year>) <volume>11</volume>:<fpage>193</fpage>&#x2013;<lpage>5</lpage>. <pub-id pub-id-type="doi">10.1016/j.jcmg.2016.12.027</pub-id><pub-id pub-id-type="pmid">28412422</pub-id></citation></ref>
<ref id="B4"><label>4.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Campbell</surname><given-names>BCV</given-names></name><name><surname>Khatri</surname><given-names>P</given-names></name></person-group>. <article-title>Stroke</article-title>. <source>Lancet</source>. (<year>2020</year>) <volume>396</volume>:<fpage>129</fpage>&#x2013;<lpage>42</lpage>. <pub-id pub-id-type="doi">10.1016/s0140-6736(20)31179-x</pub-id><pub-id pub-id-type="pmid">32653056</pub-id></citation></ref>
<ref id="B5"><label>5.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guo</surname><given-names>J</given-names></name><name><surname>Wang</surname><given-names>H</given-names></name><name><surname>Li</surname><given-names>Y</given-names></name><name><surname>Zhu</surname><given-names>S</given-names></name><name><surname>Hu</surname><given-names>H</given-names></name><name><surname>Gu</surname><given-names>Z</given-names></name></person-group>. <article-title>Nanotechnology in coronary heart disease</article-title>. <source>Acta Biomater</source>. (<year>2023</year>) <volume>171</volume>:<fpage>37</fpage>&#x2013;<lpage>67</lpage>. <pub-id pub-id-type="doi">10.1016/j.actbio.2023.09.011</pub-id><pub-id pub-id-type="pmid">37714246</pub-id></citation></ref>
<ref id="B6"><label>6.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hakeem</surname><given-names>A</given-names></name><name><surname>Bhatti</surname><given-names>S</given-names></name><name><surname>Chang</surname><given-names>SM</given-names></name></person-group>. <article-title>Screening and risk stratification of coronary artery disease in end-stage renal disease</article-title>. <source>JACC Cardiovasc Imaging</source>. (<year>2014</year>) <volume>7</volume>:<fpage>715</fpage>&#x2013;<lpage>28</lpage>. <pub-id pub-id-type="doi">10.1016/j.jcmg.2013.12.015</pub-id><pub-id pub-id-type="pmid">25034921</pub-id></citation></ref>
<ref id="B7"><label>7.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>W</given-names></name><name><surname>Wu</surname><given-names>YF</given-names></name><name><surname>Zhao</surname><given-names>D</given-names></name><name><surname>Yang</surname><given-names>Y</given-names></name><name><surname>Lang</surname><given-names>LR</given-names></name><name><surname>Wang</surname><given-names>M</given-names></name><etal/></person-group> <article-title>Distribution characteristics and risk factors of carotid atherosclerosis in middle-aged and elderly Chinese</article-title>. <source>Zhonghua Xin Xue Guan Bing Za Zhi</source>. (<year>2010</year>) <volume>38</volume>:<fpage>553</fpage>&#x2013;<lpage>7</lpage>.<pub-id pub-id-type="pmid">21033140</pub-id></citation></ref>
<ref id="B8"><label>8.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname><given-names>S</given-names></name><name><surname>Li</surname><given-names>Y</given-names></name><name><surname>Zeng</surname><given-names>X</given-names></name><name><surname>Wang</surname><given-names>H</given-names></name><name><surname>Yin</surname><given-names>P</given-names></name><name><surname>Wang</surname><given-names>L</given-names></name><etal/></person-group> <article-title>Burden of cardiovascular diseases in China, 1990&#x2013;2016: findings from the 2016 Global Burden of Disease Study</article-title>. <source>JAMA Cardiol</source>. (<year>2019</year>) <volume>4</volume>:<fpage>342</fpage>&#x2013;<lpage>52</lpage>. <pub-id pub-id-type="doi">10.1001/jamacardio.2019.0295</pub-id><pub-id pub-id-type="pmid">30865215</pub-id></citation></ref>
<ref id="B9"><label>9.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname><given-names>JH</given-names></name><name><surname>Zhang</surname><given-names>L</given-names></name><name><surname>Wang</surname><given-names>J</given-names></name><name><surname>Li</surname><given-names>J</given-names></name><name><surname>Wang</surname><given-names>HD</given-names></name><name><surname>Li</surname><given-names>XM</given-names></name><etal/></person-group> <article-title>Association between occupational stress and carotid atherosclerosis among the workers in a steel plant</article-title>. <source>Zhonghua Lao Dong Wei Sheng Zhi Ye Bing Za Zhi</source>. (<year>2020</year>) <volume>38</volume>:<fpage>262</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.3760/cma.j.cn121094-20190401-00125</pub-id><pub-id pub-id-type="pmid">32447888</pub-id></citation></ref>
<ref id="B10"><label>10.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname><given-names>L</given-names></name><name><surname>Wen</surname><given-names>F</given-names></name><name><surname>Xu</surname><given-names>X</given-names></name><name><surname>Wang</surname><given-names>L</given-names></name></person-group>. <article-title>Effective resources for improving mental health among Chinese underground coal miners: perceived organizational support and psychological capital</article-title>. <source>J Occup Health</source>. (<year>2015</year>) <volume>57</volume>:<fpage>58</fpage>&#x2013;<lpage>68</lpage>. <pub-id pub-id-type="doi">10.1539/joh.14-0082-OA</pub-id><pub-id pub-id-type="pmid">25410268</pub-id></citation></ref>
<ref id="B11"><label>11.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname><given-names>FD</given-names></name><name><surname>Pan</surname><given-names>ZQ</given-names></name><name><surname>Liu</surname><given-names>SL</given-names></name><name><surname>Chen</surname><given-names>L</given-names></name><name><surname>Ma</surname><given-names>JZ</given-names></name><name><surname>Yang</surname><given-names>ML</given-names></name><etal/></person-group> <article-title>The estimation of the number of underground coal miners and the annual dose to coal miners in China</article-title>. <source>Health Phys</source>. (<year>2007</year>) <volume>93</volume>:<fpage>127</fpage>&#x2013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1097/01.HP.0000261600.29366.b4</pub-id><pub-id pub-id-type="pmid">17622817</pub-id></citation></ref>
<ref id="B12"><label>12.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xie</surname><given-names>Y</given-names></name><name><surname>He</surname><given-names>W</given-names></name><name><surname>Zhang</surname><given-names>X</given-names></name><name><surname>Cui</surname><given-names>J</given-names></name><name><surname>Tian</surname><given-names>X</given-names></name><name><surname>Chen</surname><given-names>J</given-names></name><etal/></person-group> <article-title>Association of air pollution and greenness with carotid plaque: a prospective cohort study in China</article-title>. <source>Environ Pollut</source>. (<year>2021</year>) <volume>273</volume>:<fpage>116514</fpage>. <pub-id pub-id-type="doi">10.1016/j.envpol.2021.116514</pub-id><pub-id pub-id-type="pmid">33486240</pub-id></citation></ref>
<ref id="B13"><label>13.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wong</surname><given-names>R</given-names></name><name><surname>Crane</surname><given-names>A</given-names></name><name><surname>Sheth</surname><given-names>J</given-names></name><name><surname>Mayrovitz</surname><given-names>HN</given-names></name></person-group>. <article-title>Shift work as a cardiovascular disease risk factor: a narrative review</article-title>. <source>Cureus</source>. (<year>2023</year>) <volume>15</volume>:<fpage>e41186</fpage>. <pub-id pub-id-type="doi">10.7759/cureus.41186</pub-id><pub-id pub-id-type="pmid">37525789</pub-id></citation></ref>
<ref id="B14"><label>14.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sugiura</surname><given-names>T</given-names></name><name><surname>Dohi</surname><given-names>Y</given-names></name><name><surname>Takagi</surname><given-names>Y</given-names></name><name><surname>Yoshikane</surname><given-names>N</given-names></name><name><surname>Ito</surname><given-names>M</given-names></name><name><surname>Suzuki</surname><given-names>K</given-names></name><etal/></person-group> <article-title>Impacts of lifestyle behavior and shift work on visceral fat accumulation and the presence of atherosclerosis in middle-aged male workers</article-title>. <source>Hypertens Res</source>. (<year>2020</year>) <volume>43</volume>:<fpage>235</fpage>&#x2013;<lpage>45</lpage>. <pub-id pub-id-type="doi">10.1038/s41440-019-0362-z</pub-id><pub-id pub-id-type="pmid">31780790</pub-id></citation></ref>
<ref id="B15"><label>15.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname><given-names>D</given-names></name><name><surname>Cui</surname><given-names>G</given-names></name><name><surname>Huang</surname><given-names>X</given-names></name><name><surname>Chen</surname><given-names>Y</given-names></name><name><surname>Liu</surname><given-names>G</given-names></name><name><surname>Ren</surname><given-names>L</given-names></name><etal/></person-group> <article-title>An accurate and explainable ensemble learning method for carotid plaque prediction in an asymptomatic population</article-title>. <source>Comput Methods Programs Biomed</source>. (<year>2022</year>) <volume>221</volume>:<fpage>106842</fpage>. <pub-id pub-id-type="doi">10.1016/j.cmpb.2022.106842</pub-id><pub-id pub-id-type="pmid">35569238</pub-id></citation></ref>
<ref id="B16"><label>16.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Damen</surname><given-names>JA</given-names></name><name><surname>Hooft</surname><given-names>L</given-names></name><name><surname>Schuit</surname><given-names>E</given-names></name><name><surname>Debray</surname><given-names>TP</given-names></name><name><surname>Collins</surname><given-names>GS</given-names></name><name><surname>Tzoulaki</surname><given-names>I</given-names></name><etal/></person-group> <article-title>Prediction models for cardiovascular disease risk in the general population: systematic review</article-title>. <source>Br Med J</source>. (<year>2016</year>) <volume>353</volume>:<fpage>i2416</fpage>. <pub-id pub-id-type="doi">10.1136/bmj.i2416</pub-id></citation></ref>
<ref id="B17"><label>17.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moons</surname><given-names>KG</given-names></name><name><surname>Kengne</surname><given-names>AP</given-names></name><name><surname>Woodward</surname><given-names>M</given-names></name><name><surname>Royston</surname><given-names>P</given-names></name><name><surname>Vergouwe</surname><given-names>Y</given-names></name><name><surname>Altman</surname><given-names>DG</given-names></name><etal/></person-group> <article-title>Risk prediction models: I. Development, internal validation, and assessing the incremental value of a new (bio)marker</article-title>. <source>Heart</source>. (<year>2012</year>) <volume>98</volume>:<fpage>683</fpage>&#x2013;<lpage>90</lpage>. <pub-id pub-id-type="doi">10.1136/heartjnl-2011-301246</pub-id><pub-id pub-id-type="pmid">22397945</pub-id></citation></ref>
<ref id="B18"><label>18.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bin</surname><given-names>C</given-names></name><name><surname>Li</surname><given-names>Q</given-names></name><name><surname>Tang</surname><given-names>J</given-names></name><name><surname>Dai</surname><given-names>C</given-names></name><name><surname>Jiang</surname><given-names>T</given-names></name><name><surname>Xie</surname><given-names>X</given-names></name><etal/></person-group> <article-title>Machine learning models for predicting the risk factor of carotid plaque in cardiovascular disease</article-title>. <source>Front Cardiovasc Med</source>. (<year>2023</year>) <volume>10</volume>:<fpage>1178782</fpage>. <pub-id pub-id-type="doi">10.3389/fcvm.2023.1178782</pub-id><pub-id pub-id-type="pmid">37808888</pub-id></citation></ref>
<ref id="B19"><label>19.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Weng</surname><given-names>S</given-names></name><name><surname>Chen</surname><given-names>J</given-names></name><name><surname>Ding</surname><given-names>C</given-names></name><name><surname>Hu</surname><given-names>D</given-names></name><name><surname>Liu</surname><given-names>W</given-names></name><name><surname>Yang</surname><given-names>Y</given-names></name><etal/></person-group> <article-title>Utilizing machine learning algorithms for the prediction of carotid artery plaques in a Chinese population</article-title>. <source>Front Physiol</source>. (<year>2023</year>) <volume>14</volume>:<fpage>1295371</fpage>. <pub-id pub-id-type="doi">10.3389/fphys.2023.1295371</pub-id><pub-id pub-id-type="pmid">38028761</pub-id></citation></ref>
<ref id="B20"><label>20.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hsiao</surname><given-names>CL</given-names></name><name><surname>Chen</surname><given-names>PY</given-names></name><name><surname>Hsu</surname><given-names>PJ</given-names></name><name><surname>Lin</surname><given-names>SK</given-names></name></person-group>. <article-title>Nomogram and carotid risk score for predicting moderate or high carotid atherosclerosis among asymptomatic elderly recycling volunteers</article-title>. <source>Diagnostics (Basel)</source>. (<year>2022</year>) <volume>12</volume>(<issue>6</issue>):<fpage>1407</fpage>. <pub-id pub-id-type="doi">10.3390/diagnostics12061407</pub-id><pub-id pub-id-type="pmid">35741217</pub-id></citation></ref>
<ref id="B21"><label>21.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>Y</given-names></name><name><surname>Wu</surname><given-names>Z</given-names></name><name><surname>Li</surname><given-names>X</given-names></name><name><surname>Wei</surname><given-names>J</given-names></name><name><surname>Zhang</surname><given-names>Q</given-names></name><name><surname>Wang</surname><given-names>J</given-names></name></person-group>. <article-title>Association between the triglyceride-glucose index and carotid plaque incidence: a longitudinal study</article-title>. <source>Cardiovasc Diabetol</source>. (<year>2022</year>) <volume>21</volume>:<fpage>244</fpage>. <pub-id pub-id-type="doi">10.1186/s12933-022-01683-6</pub-id><pub-id pub-id-type="pmid">36380351</pub-id></citation></ref>
<ref id="B22"><label>22.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname><given-names>H</given-names></name><name><surname>Li</surname><given-names>Y</given-names></name><name><surname>Tao</surname><given-names>L</given-names></name><name><surname>Yang</surname><given-names>L</given-names></name><name><surname>Liu</surname><given-names>D</given-names></name><name><surname>Wang</surname><given-names>Y</given-names></name><etal/></person-group> <article-title>Trajectories of lipid profile and risk of carotid atherosclerosis progression: a longitudinal cohort study</article-title>. <source>Nutrients</source>. (<year>2022</year>) <volume>14</volume>(<issue>15</issue>):<fpage>3243</fpage>. <pub-id pub-id-type="doi">10.3390/nu14153243</pub-id><pub-id pub-id-type="pmid">35956420</pub-id></citation></ref>
<ref id="B23"><label>23.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hao</surname><given-names>CN</given-names></name><name><surname>Shi</surname><given-names>YQ</given-names></name><name><surname>Huang</surname><given-names>JJ</given-names></name><name><surname>Li</surname><given-names>HY</given-names></name><name><surname>Huang</surname><given-names>ZH</given-names></name><name><surname>Cheng</surname><given-names>XW</given-names></name><etal/></person-group> <article-title>The power combination of blood-pressure parameters to predict the incidence of plaque formation in carotid arteries in elderly</article-title>. <source>Int J Clin Exp Med</source>. (<year>2013</year>) <volume>6</volume>:<fpage>461</fpage>&#x2013;<lpage>9</lpage>.<pub-id pub-id-type="pmid">23844270</pub-id></citation></ref>
<ref id="B24"><label>24.</label><citation citation-type="journal"><collab>NCD Risk Factor Collaboration (NCD-RisC)</collab>. <article-title>Worldwide trends in blood pressure from 1975 to 2015: a pooled analysis of 1479 population-based measurement studies with 19&#x00B7;1 million participants</article-title>. <source>Lancet</source>. (<year>2017</year>) <volume>389</volume>(<issue>10064</issue>):<fpage>37</fpage>&#x2013;<lpage>55</lpage>. <pub-id pub-id-type="doi">10.1016/s0140-6736(16)31919-5</pub-id>. Erratum in: <italic>Lancet</italic>. (2020) 396(10255):886. doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/S0140-6736(20)31972-3">10.1016/S0140-6736(20)31972-3</ext-link><pub-id pub-id-type="pmid">27863813</pub-id></citation></ref>
<ref id="B25"><label>25.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kleipool</surname><given-names>EEF</given-names></name><name><surname>Rozendaal</surname><given-names>ES</given-names></name><name><surname>Mahadew</surname><given-names>SKN</given-names></name><name><surname>Kramer</surname><given-names>MHH</given-names></name><name><surname>Van Den Born</surname><given-names>BH</given-names></name><name><surname>Sern&#x00E9;</surname><given-names>EH</given-names></name><etal/></person-group> <article-title>The value of ambulatory blood pressure measurement to detect masked diastolic hypotension in older patients treated for hypertension</article-title>. <source>Age Ageing</source>. (<year>2021</year>) <volume>50</volume>(<issue>4</issue>):<fpage>1229</fpage>&#x2013;<lpage>35</lpage>. <pub-id pub-id-type="doi">10.1093/ageing/afaa287</pub-id><pub-id pub-id-type="pmid">33454734</pub-id></citation></ref>
<ref id="B26"><label>26.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname><given-names>Y</given-names></name><name><surname>Zhu</surname><given-names>Y</given-names></name><name><surname>Jia</surname><given-names>W</given-names></name><name><surname>Sun</surname><given-names>D</given-names></name><name><surname>Zhao</surname><given-names>L</given-names></name><name><surname>Zhang</surname><given-names>C</given-names></name><etal/></person-group> <article-title>Association between lipid profiles and presence of carotid plaque</article-title>. <source>Sci Rep</source>. (<year>2019</year>) <volume>9</volume>:<fpage>18011</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-019-54285-w</pub-id><pub-id pub-id-type="pmid">31784590</pub-id></citation></ref>
<ref id="B27"><label>27.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhan</surname><given-names>C</given-names></name><name><surname>Shi</surname><given-names>M</given-names></name><name><surname>Yang</surname><given-names>Y</given-names></name><name><surname>Pang</surname><given-names>H</given-names></name><name><surname>Fei</surname><given-names>S</given-names></name><name><surname>Bai</surname><given-names>L</given-names></name><etal/></person-group> <article-title>Prevalence and risk factors of carotid plaque among middle-aged and elderly adults in rural Tianjin, China</article-title>. <source>Sci Rep</source>. (<year>2016</year>) <volume>6</volume>:<fpage>23870</fpage>. <pub-id pub-id-type="doi">10.1038/srep23870</pub-id><pub-id pub-id-type="pmid">27029785</pub-id></citation></ref>
<ref id="B28"><label>28.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xi</surname><given-names>J</given-names></name><name><surname>Men</surname><given-names>S</given-names></name><name><surname>Nan</surname><given-names>J</given-names></name><name><surname>Yang</surname><given-names>Q</given-names></name><name><surname>Dong</surname><given-names>J</given-names></name></person-group>. <article-title>The blood monocyte to high density lipoprotein cholesterol ratio (MHR) is a possible marker of carotid artery plaque</article-title>. <source>Lipids Health Dis</source>. (<year>2022</year>) <volume>21</volume>:<fpage>130</fpage>. <pub-id pub-id-type="doi">10.1186/s12944-022-01741-8</pub-id><pub-id pub-id-type="pmid">36463176</pub-id></citation></ref>
<ref id="B29"><label>29.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shen</surname><given-names>P</given-names></name><name><surname>Zhou</surname><given-names>Y</given-names></name><name><surname>Song</surname><given-names>A</given-names></name><name><surname>Wan</surname><given-names>Y</given-names></name><name><surname>Fan</surname><given-names>Z</given-names></name><name><surname>Xu</surname><given-names>R</given-names></name></person-group>. <article-title>The association of metabolic health obesity with incidence of carotid artery plaque in Chinese adults</article-title>. <source>Nutr Metab Cardiovasc Dis</source>. (<year>2021</year>) <volume>31</volume>:<fpage>2376</fpage>&#x2013;<lpage>81</lpage>. <pub-id pub-id-type="doi">10.1016/j.numecd.2021.05.003</pub-id><pub-id pub-id-type="pmid">34154886</pub-id></citation></ref>
<ref id="B30"><label>30.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Botvin Moshe</surname><given-names>C</given-names></name><name><surname>Haratz</surname><given-names>S</given-names></name><name><surname>Ravona-Springer</surname><given-names>R</given-names></name><name><surname>Heymann</surname><given-names>A</given-names></name><name><surname>Hung-Mo</surname><given-names>L</given-names></name><name><surname>Schnaider Beeri</surname><given-names>M</given-names></name><etal/></person-group> <article-title>Long-term trajectories of BMI predict carotid stiffness and plaque volume in type 2 diabetes older adults: a cohort study</article-title>. <source>Cardiovasc Diabetol</source>. (<year>2020</year>) <volume>19</volume>:<fpage>138</fpage>. <pub-id pub-id-type="doi">10.1186/s12933-020-01104-6</pub-id><pub-id pub-id-type="pmid">32933542</pub-id></citation></ref>
<ref id="B31"><label>31.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Elkind</surname><given-names>MS</given-names></name><name><surname>Cheng</surname><given-names>J</given-names></name><name><surname>Boden-Albala</surname><given-names>B</given-names></name><name><surname>Paik</surname><given-names>MC</given-names></name><name><surname>Sacco</surname><given-names>RL</given-names></name></person-group>. <article-title>Elevated white blood cell count and carotid plaque thickness: the Northern Manhattan Stroke Study</article-title>. <source>Stroke</source>. (<year>2001</year>) <volume>32</volume>:<fpage>842</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1161/01.str.32.4.842</pub-id><pub-id pub-id-type="pmid">11283380</pub-id></citation></ref>
<ref id="B32"><label>32.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ortega</surname><given-names>E</given-names></name><name><surname>Gilabert</surname><given-names>R</given-names></name><name><surname>Nu&#x00F1;ez</surname><given-names>I</given-names></name><name><surname>Cof&#x00E1;n</surname><given-names>M</given-names></name><name><surname>Sala-Vila</surname><given-names>A</given-names></name><name><surname>De Groot</surname><given-names>E</given-names></name><etal/></person-group> <article-title>White blood cell count is associated with carotid and femoral atherosclerosis</article-title>. <source>Atherosclerosis</source>. (<year>2012</year>) <volume>221</volume>:<fpage>275</fpage>&#x2013;<lpage>81</lpage>. <pub-id pub-id-type="doi">10.1016/j.atherosclerosis.2011.12.038</pub-id><pub-id pub-id-type="pmid">22244768</pub-id></citation></ref>
<ref id="B33"><label>33.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>X</given-names></name><name><surname>Zhang</surname><given-names>T</given-names></name><name><surname>Wu</surname><given-names>C</given-names></name><name><surname>Zhou</surname><given-names>Y</given-names></name><name><surname>Chen</surname><given-names>Z</given-names></name><name><surname>Xu</surname><given-names>R</given-names></name></person-group>. <article-title>The association between inflammatory biomarkers and carotid artery plaque in normal-weight and metabolically healthy Chinese adults: a cross-sectional study</article-title>. <source>Hypertens Res</source>. (<year>2023</year>) <volume>46</volume>:<fpage>330</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1038/s41440-022-01062-4</pub-id><pub-id pub-id-type="pmid">36224287</pub-id></citation></ref>
<ref id="B34"><label>34.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Austin</surname><given-names>PC</given-names></name><name><surname>Steyerberg</surname><given-names>EW</given-names></name></person-group>. <article-title>The integrated calibration index (ICI) and related metrics for quantifying the calibration of logistic regression models</article-title>. <source>Stat Med</source>. (<year>2019</year>) <volume>38</volume>:<fpage>4051</fpage>&#x2013;<lpage>65</lpage>. <pub-id pub-id-type="doi">10.1002/sim.8281</pub-id><pub-id pub-id-type="pmid">31270850</pub-id></citation></ref>
<ref id="B35"><label>35.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>L</given-names></name><name><surname>Zhang</surname><given-names>S</given-names></name><name><surname>Yu</surname><given-names>M</given-names></name><name><surname>Yuan</surname><given-names>J</given-names></name></person-group>. <article-title>Association between rotating night shift work and carotid atherosclerosis among Chinese steelworkers: a cross-sectional survey</article-title>. <source>Hypertens Res</source>. (<year>2022</year>) <volume>45</volume>:<fpage>686</fpage>&#x2013;<lpage>97</lpage>. <pub-id pub-id-type="doi">10.1038/s41440-021-00821-z</pub-id><pub-id pub-id-type="pmid">35145252</pub-id></citation></ref></ref-list>
</back>
</article>