<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Cardiovasc. Med.</journal-id>
<journal-title>Frontiers in Cardiovascular Medicine</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Cardiovasc. Med.</abbrev-journal-title>
<issn pub-type="epub">2297-055X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fcvm.2024.1392752</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Cardiovascular Medicine</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Screening for carotid atherosclerosis: development and validation of a high-precision risk scoring tool</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes"><name><surname>Huang</surname><given-names>Zhi-Xin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="cor1">&#x002A;</xref><uri xlink:href="https://loop.frontiersin.org/people/554933/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
</contrib>
<contrib contrib-type="author"><name><surname>Chen</surname><given-names>Lijuan</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
</contrib>
<contrib contrib-type="author"><name><surname>Chen</surname><given-names>Ping</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
</contrib>
<contrib contrib-type="author"><name><surname>Dai</surname><given-names>Yingyi</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
</contrib>
<contrib contrib-type="author"><name><surname>Lu</surname><given-names>Haike</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
</contrib>
<contrib contrib-type="author"><name><surname>Liang</surname><given-names>Yicheng</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
</contrib>
<contrib contrib-type="author"><name><surname>Ding</surname><given-names>Qingguo</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
</contrib>
<contrib contrib-type="author"><name><surname>Liang</surname><given-names>Piaonan</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
</contrib>
</contrib-group>
<aff id="aff1"><label><sup>1</sup></label><institution>Department of Neurology, The Affiliated Guangdong Second Provincial General Hospital of Jinan University</institution>, <addr-line>Guangzhou, Guangdong</addr-line>, <country>China</country></aff>
<aff id="aff2"><label><sup>2</sup></label><institution>Guangzhou University of Chinese Medicine</institution>, <addr-line>Guangzhou, Guangdong</addr-line>, <country>China</country></aff>
<aff id="aff3"><label><sup>3</sup></label><institution>Department of Ultrasound, Songyang County People&#x2019;s Hospital</institution>, <addr-line>Lishui, Zhejiang</addr-line>, <country>China</country></aff>
<aff id="aff4"><label><sup>4</sup></label><institution>Department of Neurology, The First Hospital of Putian City</institution>, <addr-line>Putian, Fujiang</addr-line>, <country>China</country></aff>
<aff id="aff5"><label><sup>5</sup></label><institution>Department of Neurology, Nanhai Economic Development Zone Peoples Hospital</institution>, <addr-line>Foshan, Guangdong</addr-line>, <country>China</country></aff>
<aff id="aff6"><label><sup>6</sup></label>Department of Rehabilitation Medicine, <institution>The Affiliated Guangdong Second Provincial General Hospital of Jinan University</institution>, Guangzhou, Guangdong, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p><bold>Edited by:</bold> Teresa Padro, Institut de Recerca de l&#x0027;Hospital de la Santa Creu i Sant Pau, Spain</p></fn>
<fn fn-type="edited-by"><p><bold>Reviewed by:</bold> Oscar Rafael Escate Ch&#x00E1;vez, Sant Pau Institute for Biomedical Research, Spain</p>
<p>Dalin Tang, Worcester Polytechnic Institute, United States</p></fn>
<corresp id="cor1"><label>&#x002A;</label><bold>Correspondence:</bold> Zhi-Xin Huang <email>hzxd6@163.com</email></corresp>
</author-notes>
<pub-date pub-type="epub"><day>25</day><month>07</month><year>2024</year></pub-date>
<pub-date pub-type="collection"><year>2024</year></pub-date>
<volume>11</volume><elocation-id>1392752</elocation-id>
<history>
<date date-type="received"><day>28</day><month>02</month><year>2024</year></date>
<date date-type="accepted"><day>15</day><month>07</month><year>2024</year></date>
</history>
<permissions>
<copyright-statement>&#x00A9; 2024 Huang, Chen, Chen, Dai, Lu, Liang, Ding and Liang.</copyright-statement>
<copyright-year>2024</copyright-year><copyright-holder>Huang, Chen, Chen, Dai, Lu, Liang, Ding and Liang</copyright-holder><license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<sec><title>Objective</title>
<p>This study aimed to investigate the prevalence of carotid atherosclerosis (CAS), especially among seniors, and develop a precise risk assessment tool to facilitate screening and early intervention for high-risk individuals.</p>
</sec>
<sec><title>Methods</title>
<p>A comprehensive approach was employed, integrating traditional epidemiological methods with advanced machine learning techniques, including support vector machines, XGBoost, decision trees, random forests, and logistic regression.</p>
</sec>
<sec><title>Results</title>
<p>Among 1,515 participants, CAS prevalence reached 57.4&#x0025;, concentrated within older individuals. Positive correlations were identified with age, systolic blood pressure, a history of hypertension, male gender, and total cholesterol. High-density lipoprotein (HDL) emerged as a protective factor against CAS, with total cholesterol and HDL levels proving significant predictors.</p>
</sec>
<sec><title>Conclusions</title>
<p>This research illuminates the risk factors linked to CAS and introduces a validated risk scoring tool, highlighted by the logistic classifier&#x0027;s consistent performance during training and testing. This tool shows potential for pinpointing high-risk individuals in community health programs, streamlining screening and intervention by clinical physicians. By stressing the significance of managing cholesterol levels, especially HDL, our findings provide actionable insights for CAS prevention. Nonetheless, rigorous validation is paramount to guarantee its practicality and efficacy in real-world scenarios.</p>
</sec>
</abstract>
<kwd-group>
<kwd>prevention</kwd>
<kwd>cerebrovascular disease</kwd>
<kwd>screening</kwd>
<kwd>ultrasound</kwd>
<kwd>machine learning</kwd>
<kwd>carotid atherosclerosis</kwd>
</kwd-group>
<contract-num rid="cn001">2024B03J0436</contract-num>
<contract-num rid="cn002">B2021382</contract-num>
<contract-sponsor id="cn001">Science and Technology Program of Guangzhou, China</contract-sponsor>
<contract-sponsor id="cn002">Medical Scientific Research Foundation of Guangdong Province, China</contract-sponsor>
<counts>
<fig-count count="4"/>
<table-count count="4"/><equation-count count="3"/><ref-count count="16"/><page-count count="10"/><word-count count="0"/></counts><custom-meta-wrap><custom-meta><meta-name>section-at-acceptance</meta-name><meta-value>Atherosclerosis and Vascular Medicine</meta-value></custom-meta></custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro"><title>Introduction</title>
<p>Carotid atherosclerosis (CAS) is not just an indication of systemic atherosclerosis in the carotid arteries; its implications extend far beyond that (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B2">2</xref>). Firstly, CAS had garnered significant attention due to its close association with stroke (<xref ref-type="bibr" rid="B3">3</xref>), a grave health concern where CAS was recognized as a major contributing factor. Notably, asymptomatic CAS exhibits a high prevalence of up to 40&#x0025; among middle-aged and elderly individuals, implying that it may have remained unnoticed in many individuals (<xref ref-type="bibr" rid="B4">4</xref>). Rupture of atherosclerotic plaques in the carotid arteries could trigger transient ischemic attacks and strokes, profoundly impacting patients&#x2019; lives. Moreover, given atherosclerosis was a systemic disease, there exists a close relationship between CAS and coronary atherosclerosis, further elevating the risk of cardiovascular and cerebrovascular diseases (<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B6">6</xref>). These multiple hazards underscored the urgent need for in-depth research and management of CAS.</p>
<p>In the process of studying and managing CAS, ultrasound diagnosis played a pivotal role (<xref ref-type="bibr" rid="B7">7</xref>). Carotid ultrasound examination provides crucial insights into the disease severity. It facilitated early diagnosis and monitoring of disease progression by quantifying carotid intima-media thickness (CIMT) and detecting carotid atherosclerotic plaques (CAP) (<xref ref-type="bibr" rid="B8">8</xref>, <xref ref-type="bibr" rid="B9">9</xref>). This non-invasive tool boasted safety benefits without radiation risks while remaining applicable across extensive age groups from children to seniors. These advantages made ultrasound diagnosis a powerful methodology for elucidating the underpinnings and clinical approaches for CAS. Our focus was on the overlooked community populations. We utilized ultrasound techniques for CAS screening, aiming to ascertain subjects at risk and further evaluate associated factors. This endeavor provides valuable data that could enable the establishment of a robust scoring model to accurately evaluate CAS risks in patients and tailor preventive tactics. Through this study, we aim to thoroughly characterize and strategize management of CAS, especially in community settings, filling knowledge gaps to enhance screening and care.</p>
</sec>
<sec id="s2" sec-type="methods"><title>Methods</title>
<sec id="s2a"><title>Study population</title>
<p>The study protocol was reviewed and approved by the Ethical Committee of Guangdong Second Provincial General Hospital (Approval number: GD2H-KY IRB-AF-SC.07-01.2), and the ethical guidelines of the 1975 Declaration of Helsinki were followed.</p>
<p>A prospective longitudinal study named Ivy Action was performed in the form of a voluntary prevention screening program for ischemic cerebrovascular disease targeting the adult population of multicenter communities (Guangzhou) in 2018&#x2013;2019. The study included individuals aged 35 years or older, who had no history of stroke or had experienced a good recovery after stroke with a modified Rankin scale score of 2 or less indicating good recovery. Exclusion criteria included individuals unable to communicate with the research team, those with mobility impairments hindering study participation, individuals with heart, liver, or kidney failure, and patients with a history of malignancy. The comprehensive study protocol included gathering information on basic socio-economic status, social and residential status, smoking, housework, physical activity, sleep and dietary habits. Additionally, cardiovascular risk factors, family history and medical history were meticulously recorded.</p>
<p>In our machine learning models, we employed a comprehensive set of risk factors, including age, gender, biomarkers, systolic and diastolic blood pressure, health status, lifestyle factors, family history of cardiovascular disease, and medical history (<xref ref-type="table" rid="T1">Table&#x00A0;1</xref>). These factors were chosen for their well-documented association with carotid atherosclerosis and their clinical significance in predicting cardiovascular events. The medical exam included non-invasive tests (resting blood pressure, anthropometric measurements), ECG, anxiety and depression Scale, venous blood tests performed in a central laboratory with conventional enzymatic methods, echocardiography and carotid duplex scans (<xref ref-type="bibr" rid="B10">10</xref>). Waist and hip circumference were measured with light clothing. Cardiac History encompasses any medical history of coronary artery disease, myocardial infarction, angina, atrial fibrillation, or valvular heart disease. A waist-to-hip ratio over 0.90 for men and &#x003E;0.85 for women was considered central obesity.</p>
<table-wrap id="T1" position="float"><label>Table 1</label>
<caption><p>Demographic information for participants.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Characteristic</th>
<th valign="top" align="center">No, <italic>N</italic>&#x2009;&#x003D;&#x2009;646<xref ref-type="table-fn" rid="table-fn1"><sup>a</sup></xref></th>
<th valign="top" align="center">Yes, <italic>N</italic>&#x2009;&#x003D;&#x2009;869<xref ref-type="table-fn" rid="table-fn1"><sup>a</sup></xref></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" colspan="3">Sex</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Male</td>
<td valign="top" align="center">157 (24&#x0025;)</td>
<td valign="top" align="center">350 (40&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Female</td>
<td valign="top" align="center">489 (76&#x0025;)</td>
<td valign="top" align="center">519 (60&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">Age</td>
<td valign="top" align="center">54 (45, 60)</td>
<td valign="top" align="center">63 (59, 68)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Biomarkers</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;hsCRP</td>
<td valign="top" align="center">0.85 (0.43, 1.78)</td>
<td valign="top" align="center">1.14 (0.59, 2.39)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">5</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Uric Acid</td>
<td valign="top" align="center">329 (274, 396)</td>
<td valign="top" align="center">351 (297, 428)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Hemoglobin</td>
<td valign="top" align="center">5.60 (5.30, 5.80)</td>
<td valign="top" align="center">5.70 (5.50, 6.10)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Glucose</td>
<td valign="top" align="center">4.69 (4.34, 5.18)</td>
<td valign="top" align="center">5.03 (4.58, 5.91)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Homocysteine</td>
<td valign="top" align="center">10.4 (8.8, 12.6)</td>
<td valign="top" align="center">11.7 (9.8, 14.3)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;LDL</td>
<td valign="top" align="center">2.83 (2.37, 3.30)</td>
<td valign="top" align="center">3.00 (2.45, 3.63)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;TG</td>
<td valign="top" align="center">1.27 (0.93, 1.90)</td>
<td valign="top" align="center">1.50 (1.10, 2.08)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;HDL</td>
<td valign="top" align="center">1.31 (1.15, 1.52)</td>
<td valign="top" align="center">1.29 (1.13, 1.49)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;TC</td>
<td valign="top" align="center">5.26 (4.65, 5.91)</td>
<td valign="top" align="center">5.42 (4.74, 6.16)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Blood pressure</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;SBP</td>
<td valign="top" align="center">120 (109, 131)</td>
<td valign="top" align="center">133 (121, 146)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">18</td>
<td valign="top" align="center">11</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;DBP</td>
<td valign="top" align="center">79 (73, 86)</td>
<td valign="top" align="center">82 (75, 89)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">18</td>
<td valign="top" align="center">11</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Medical history</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Hypertension</td>
<td valign="top" align="center">100 (15&#x0025;)</td>
<td valign="top" align="center">330 (38&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Dyslipidemia</td>
<td valign="top" align="center">116 (18&#x0025;)</td>
<td valign="top" align="center">264 (30&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Diabetes</td>
<td valign="top" align="center">29 (4.5&#x0025;)</td>
<td valign="top" align="center">114 (13&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Cardiac history</td>
<td valign="top" align="center">26 (4.0&#x0025;)</td>
<td valign="top" align="center">109 (13&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Depression or anxiety</td>
<td valign="top" align="center">124 (19&#x0025;)</td>
<td valign="top" align="center">154 (18&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Cognitive impairment</td>
<td valign="top" align="center">13 (2.0&#x0025;)</td>
<td valign="top" align="center">19 (2.2&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Family history</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Stroke</td>
<td valign="top" align="center">103 (16&#x0025;)</td>
<td valign="top" align="center">140 (16&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Coronary heart disease</td>
<td valign="top" align="center">65 (10&#x0025;)</td>
<td valign="top" align="center">105 (12&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Hypertension</td>
<td valign="top" align="center">245 (38&#x0025;)</td>
<td valign="top" align="center">325 (37&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Diabetes</td>
<td valign="top" align="center">106 (16&#x0025;)</td>
<td valign="top" align="center">109 (13&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Health status</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;BMI</td>
<td valign="top" align="center">23.2 (21.5, 25.2)</td>
<td valign="top" align="center">23.8 (21.8, 25.8)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">16</td>
<td valign="top" align="center">14</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Central obesity</td>
<td valign="top" align="center">323 (50&#x0025;)</td>
<td valign="top" align="center">592 (68&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Smoking</td>
<td valign="top" align="center">76 (12&#x0025;)</td>
<td valign="top" align="center">159 (18&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Drinking</td>
<td valign="top" align="center">103 (16&#x0025;)</td>
<td valign="top" align="center">204 (24&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">3</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Sleep</td>
<td valign="top" align="center">357 (56&#x0025;)</td>
<td valign="top" align="center">492 (57&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">10</td>
<td valign="top" align="center">6</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Lifestyle factors</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Living alone</td>
<td valign="top" align="center">23 (3.6&#x0025;)</td>
<td valign="top" align="center">44 (5.1&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">3</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Sport levels</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Lack of physical activity</td>
<td valign="top" align="center">270 (50&#x0025;)</td>
<td valign="top" align="center">355 (47&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Frequent physical activity</td>
<td valign="top" align="center">270 (50&#x0025;)</td>
<td valign="top" align="center">393 (53&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">106</td>
<td valign="top" align="center">121</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Housework Level</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;No</td>
<td valign="top" align="center">37 (6.3&#x0025;)</td>
<td valign="top" align="center">73 (9.0&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Occasionally</td>
<td valign="top" align="center">46 (7.8&#x0025;)</td>
<td valign="top" align="center">68 (8.4&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;30&#x2005;min_perday</td>
<td valign="top" align="center">35 (5.9&#x0025;)</td>
<td valign="top" align="center">55 (6.8&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;30&#x2005;min&#x2013;1&#x2005;h_perday</td>
<td valign="top" align="center">90 (15&#x0025;)</td>
<td valign="top" align="center">130 (16&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;1&#x2013;3&#x2005;h_perday</td>
<td valign="top" align="center">243 (41&#x0025;)</td>
<td valign="top" align="center">307 (38&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;4&#x2005;h_perday</td>
<td valign="top" align="center">140 (24&#x0025;)</td>
<td valign="top" align="center">180 (22&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">55</td>
<td valign="top" align="center">56</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Mutual action</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Virtually none</td>
<td valign="top" align="center">221 (39&#x0025;)</td>
<td valign="top" align="center">299 (38&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;1&#x2013;2days_perweek</td>
<td valign="top" align="center">214 (38&#x0025;)</td>
<td valign="top" align="center">278 (35&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;3&#x2013;5days_perweek</td>
<td valign="top" align="center">85 (15&#x0025;)</td>
<td valign="top" align="center">138 (17&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;6&#x2013;7days_perweek</td>
<td valign="top" align="center">46 (8.1&#x0025;)</td>
<td valign="top" align="center">80 (10&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&#x2003;Unknown</td>
<td valign="top" align="center">80</td>
<td valign="top" align="center">74</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="table-fn1"><label><sup>a</sup></label><p><italic>n</italic> (&#x0025;); Median (IQR); &#x201C;unknown&#x201D; indicates missing values.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>It is essential to note that the primary aim of this study was focused on the prevention and management of stroke. All examination procedures were provided free of charge, and participants had the option to voluntarily undergo testing, ensuring that the study adhered to ethical standards and obtained informed consent from the participants.</p>
</sec>
<sec id="s2b"><title>Utilizing high-resolution ultrasound to assess CAS</title>
<p>An examination was conducted with the patient supine with the head slightly extended. Carotid intima media thickness (IMT) was evaluated with a 7.5&#x2005;MHz linear array transducer using a LOGIO E ultrasound (GE healthcare, USA). Measurements were taken carefully, analyzing the maximum IMT at two sites and all interfaces of the near and far walls of the common carotid artery (CCA), located 1&#x2013;1.5&#x2005;cm below its bifurcation. To obtain anechoic images, adjustments the image gain, depth, and focus were meticulously made for each participant. Plaques were defined as a focal thickening extending into the lumen by at least 0.5&#x2005;mm or as IMTs greater than 1.5&#x2005;mm, measured between the near- and far-walls of any carotid segment in the internal carotid artery, common carotid arteries, and carotid bulb. Carotid artery (CA) was defined as having a maximal intima-media thickness (IMT) of &#x2265;1.0&#x2005;mm and/or the presence of atherosclerotic plaques. To minimize intra-operator variation, a single experienced sonographer conducted all ultrasound examinations.</p>
</sec>
<sec id="s2c"><title>A comprehensive approach to machine learning modeling and evaluation</title>
<p>The analytical approach employed in this study leveraged R code to perform several critical steps. To address missing data, the &#x201C;missRanger&#x201D; package was utilized for imputing missing values. Subsequently, a diverse set of machine learning models, encompassing support vector machines (SVM), XGBoost, decision trees, random forests, and logistic regression, were employed. Hyperparameter tuning was conducted through random search to identify the optimal model configuration. To ensure robust model performance while mitigating overfitting, a 5-fold cross-validation strategy was implemented. Given the presence of imbalanced target classes, data balance was achieved through oversampling. Model performance evaluation primarily relied on the area under the curve (AUC) metric, facilitating the selection of the best-performing machine learning method as the final model.</p>
<p>In the final model evaluation, three key approaches were employed: (1) ROC and PRC (Precision-Recall Curve) plots provided in-depth insights into model performance. (2) Model calibration was conducted using the calibration function from the &#x201C;calibrate&#x201D; package. This process involved generating calibration plots for apparent and bias-corrected probabilities to comprehensively assess model performance. (3) Decision Curve Analysis (DCA) was carried out to evaluate the clinical utility of the model. Decision curves and the plot_decision_curve function were employed to visualize the net benefit of the model across various threshold probabilities.</p>
<p>Additionally, a forest plot was created using the forest_model function from the &#x201C;forestmodel&#x201D; package, offering deeper insights into the relationship between predictor variables and the outcome variable. Sample size calculation was executed using the ShowRegTable function, contributing to an understanding of dataset characteristics and ensuring an adequate sample size for the analysis.</p>
<p>In summary, this methodological approach comprised data imputation, machine learning modeling, hyperparameter tuning, cross-validation, data balancing, and comprehensive model performance evaluation, culminating in the selection of the best-performing model. The final model evaluation involved ROC and PRC plots, model calibration, Decision Curve Analysis, and a forest plot. Sample size calculations were conducted to support the robustness of the analysis.</p>
</sec>
<sec id="s2d"><title>Developing a risk scoring system</title>
<p>Grouping and Reference Value Selection of Risk Factors: Firstly, risk factors are grouped based on their clinical significance or common usage. In each group, appropriate numerical values are selected as reference values (Wij). Typically, the midpoint of the group is chosen as the reference value. Secondly, Handling Categorical Variables: For categorical variables such as gender, a category is chosen as the reference, and its reference value is set to 0, while other categories are naturally assigned numerical values, typically 1. Basic Risk Reference Value: Each risk factor needs to have a suitable group selected as the basic risk reference value (WiREF). When constructing a scoring tool later, the score for this group will be set as 0. Scores for other groups will be assigned positive or negative values based on their relationship with WiREF. Scoring Calculation: Using the regression coefficients estimated by a multiple logistic regression model (<italic>&#x03B2;</italic>i) and the reference values for each risk factor group (Wij), the distance between each risk factor&#x0027;s group and the basic risk reference value (WiREF) is calculated (D). The calculation formula is D&#x2009;&#x003D;&#x2009;(Wij&#x2212;WiREF) &#x002A; <italic>&#x03B2;</italic>i. Thirdly, Risk Probability Calculation: Using the equation of a multiple logistic regression model, the probability of risk prediction <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM1"><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mrow><mml:mover><mml:mrow><mml:mspace width="thinmathspace" /><mml:mi>p</mml:mi></mml:mrow><mml:mo>&#x005E;</mml:mo></mml:mover></mml:mrow></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:math></inline-formula> for each score is calculated. This probability value represents the likelihood of an individual experiencing a specific event under certain risk factors. The formula is:<disp-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="UDM1"><mml:mrow><mml:mover><mml:mrow><mml:mspace width="thinmathspace" /><mml:mi>p</mml:mi></mml:mrow><mml:mo>&#x005E;</mml:mo></mml:mover></mml:mrow><mml:mo>=</mml:mo><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mn>1</mml:mn><mml:mo>+</mml:mo><mml:mi>exp</mml:mi><mml:mo>&#x2061;</mml:mo><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mo>&#x2212;</mml:mo><mml:msubsup><mml:mo movablelimits="false">&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow><mml:mi>p</mml:mi></mml:msubsup><mml:mrow><mml:mi>&#x03B2;</mml:mi><mml:mi>i</mml:mi><mml:mi>X</mml:mi><mml:mi>i</mml:mi></mml:mrow></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mfrac></mml:mrow><mml:mo>,</mml:mo></mml:mstyle></mml:math></disp-formula>where <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM2"><mml:msubsup><mml:mo movablelimits="false">&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow><mml:mi>p</mml:mi></mml:msubsup><mml:mrow><mml:mi>&#x03B2;</mml:mi><mml:mi>i</mml:mi><mml:mi>X</mml:mi><mml:mi>i</mml:mi></mml:mrow></mml:math></inline-formula> represents a linear combination, which is approximately a constant term added to the product of the scores for various risk factors. Analyses were conducted using the R Statistical language (version 4.3.1; R Core Team, 2023).</p>
</sec>
</sec>
<sec id="s3" sec-type="results"><title>Results</title>
<sec id="s3a"><title>Population characteristics</title>
<p>Initially, 1,560 participants were recruited; however, 45 individuals with incomplete carotid ultrasound examinations were excluded from analysis. Consequently, the final analytical sample comprised 1,515 subjects. Carotid ultrasound revealed CAS in 869 participants, constituting a prevalence of 57.4&#x0025; in the study cohort. Individuals in the CAS group demonstrated more advanced age compared to the non-CAS group (mean 63 years vs. 54 years). Additionally, the majority of CAS individuals were female (519 subjects, accounting for prevalence of 60&#x0025;). Detailed demographic information for the entire study population is presented in <xref ref-type="table" rid="T1">Table&#x00A0;1</xref>.</p>
</sec>
<sec id="s3b"><title>Machine learning model training and evaluation process</title>
<p>The preprocessing phase involved imputing missing values to ensure a complete dataset, as depicted in <xref ref-type="fig" rid="F1">Figure&#x00A0;1</xref>. Subsequently, five machine learning models were explored, including logistic regression, support vector machines (SVM), XGBoost, decision trees and random forests. Hyperparameter optimization was carried out through random search across defined parameter spaces for each algorithm. To mitigate class imbalance, the &#x201C;oversample&#x201D; method from the classbalancing package was utilized, equalizing the training set&#x0027;s target categories. For imbalanced classification, the area under the receiver operating characteristic curve (AUC) served as a robust metric of overall performance. As shown in <xref ref-type="fig" rid="F2">Figure&#x00A0;2</xref>, the ROC curves described each learner&#x0027;s discrimination capacity across thresholds, with the AUC score quantifying overall predictive power.</p>
<fig id="F1" position="float"><label>Figure 1</label>
<caption><p>Missing data aggregation plot. On the left, the distribution of missing data is depicted as a percentage. On the right, a missing pattern analysis (aggregation missingness plot using the VIM package) is presented, showcasing the percentages of different missing patterns. 79&#x0025; of the entire study population had no missing values.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fcvm-11-1392752-g001.tif"/>
</fig>
<fig id="F2" position="float"><label>Figure 2</label>
<caption><p>AUC and ROC comparisons for imbalanced classification learners. The figure illustrates the AUC (<bold>A</bold>) and ROC (<bold>B</bold>) comparisons for different learners in the context of imbalanced classification problems. Each learner is represented by a distinct color. The AUC/ROC value, denoted in the legend, quantify the overall classification performance of each learner. The higher the AUC/ROC, the better the learner&#x0027;s ability to distinguish between classes. This set of machine learning pipelines (scale.oversample.classif.log_reg, scale.oversample.classif.svm, scale.oversample.classif.xgboost, scale.oversample.classif.rpart, scale.oversample.classif.ranger) is designed to tackle imbalanced classification problems. Firstly, by scaling features, the data is normalized to enhance the robustness of the classification algorithms. Secondly, to address class imbalance, oversampling techniques are applied to augment the number of samples in the minority class. Finally, each pipeline employs a different classifier, such as logistic regression, support vector machine, XGBoost, recursive partitioning trees (rpart), and Ranger random forest, to accomplish the ultimate classification task. This integrated framework aims to improve the model&#x0027;s ability to handle imbalanced data, thereby enhancing the overall performance of the classification algorithms. AUC, area under the curve; ROC, receiver operating characteristic curve.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fcvm-11-1392752-g002.tif"/>
</fig>
<p>Simultaneously, the AUC values for each learner on the training set were computed and visually represented in the figure. The outcomes of different machine learning algorithms on the training and test sets were summarized in <xref ref-type="table" rid="T2">Table&#x00A0;2</xref>. Remarkably high accuracy levels (79&#x0025;&#x2013;100&#x0025;) were achieved by all classifiers during the training phase. However, when applied to the test set, the overall accuracy dropped to 75&#x0025;. Notably, an accuracy of 82&#x0025; was achieved by the logistic classifier, outperforming its counterparts. This discrepancy underscores potential challenges in the model&#x0027;s generalization to unseen data, with the logistic regression model exhibiting greater robustness during the transition from training to testing phases. Therefore, the logistic regression model (<xref ref-type="fig" rid="F3">Figure&#x00A0;3</xref>) was selected as the final model, incorporating six variables: age, systolic pressure, hypertension, total cholesterol, HDL cholesterol, and sex. Based on these six variables, the model was named the AP2C2S model. Specifically, age showed a significant positive correlation with CAS (OR&#x2009;&#x003D;&#x2009;1.14, 95&#x0025; CI: 1.13&#x2013;1.16, <italic>P</italic>&#x2009;&#x003C;&#x2009;0.001), while systolic pressure also demonstrated a positive correlation (OR&#x2009;&#x003D;&#x2009;1.02, 95&#x0025; CI: 1.01&#x2013;1.02, <italic>P</italic>&#x2009;&#x003C;&#x2009;0.001). Conversely, high-density lipoprotein (HDL) exhibited a significant negative correlation with CAS (OR&#x2009;&#x003D;&#x2009;0.30, 95&#x0025; CI: 0.17&#x2013;0.50, <italic>P</italic>&#x2009;&#x003C;&#x2009;0.001), indicating its role as a protective factor against CAS. Additionally, total cholesterol (TC) showed a positive correlation with CAS (OR&#x2009;&#x003D;&#x2009;1.58, 95&#x0025; CI: 1.35&#x2013;1.86, <italic>P</italic>&#x2009;&#x003C;&#x2009;0.001). Gender, when treated as a categorical variable, was significantly associated with CAS, with males showing a higher risk (OR&#x2009;&#x003D;&#x2009;2.09, 95&#x0025; CI: 1.57&#x2013;2.80, <italic>P</italic>&#x2009;&#x003C;&#x2009;0.001). Moreover, individuals with a history of hypertension exhibited a significant positive correlation with CAS (OR&#x2009;&#x003D;&#x2009;1.53, 95&#x0025; CI: 1.11&#x2013;2.11, <italic>P</italic>&#x2009;&#x003D;&#x2009;0.009). These findings underscore the significance of these variables in predicting CAS risk and justify their inclusion in the AP2C2S model.</p>
<table-wrap id="T2" position="float"><label>Table 2</label>
<caption><p>Comparison of the performance of machine learning classifiers.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Learner</th>
<th valign="top" align="center">Area under the curve training set</th>
<th valign="top" align="center">Area under the curve test set</th>
<th valign="top" align="center">Sensitivity</th>
<th valign="top" align="center">Specificity</th>
<th valign="top" align="center">False negative rate</th>
<th valign="top" align="center">False positive rate</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Logistic regression</td>
<td valign="top" align="center">0.8505827</td>
<td valign="top" align="center">0.8208542</td>
<td valign="top" align="center">0.8216663</td>
<td valign="top" align="center">0.6595230</td>
<td valign="top" align="center">0.1783337</td>
<td valign="top" align="center">0.3404770</td>
</tr>
<tr>
<td valign="top" align="left">Support vector machines</td>
<td valign="top" align="center">0.9395673</td>
<td valign="top" align="center">0.8061250</td>
<td valign="top" align="center">0.8365956</td>
<td valign="top" align="center">0.6162075</td>
<td valign="top" align="center">0.1634044</td>
<td valign="top" align="center">0.3837925</td>
</tr>
<tr>
<td valign="top" align="left">XGBoost</td>
<td valign="top" align="center">1.0000000</td>
<td valign="top" align="center">0.7876161</td>
<td valign="top" align="center">0.8043851</td>
<td valign="top" align="center">0.6269529</td>
<td valign="top" align="center">0.1956149</td>
<td valign="top" align="center">0.3730471</td>
</tr>
<tr>
<td valign="top" align="left">Decision trees</td>
<td valign="top" align="center">0.7886977</td>
<td valign="top" align="center">0.7631142</td>
<td valign="top" align="center">0.8412331</td>
<td valign="top" align="center">0.5975671</td>
<td valign="top" align="center">0.1587669</td>
<td valign="top" align="center">0.4024329</td>
</tr>
<tr>
<td valign="top" align="left">Random forests</td>
<td valign="top" align="center">0.9995162</td>
<td valign="top" align="center">0.8145973</td>
<td valign="top" align="center">0.8596306</td>
<td valign="top" align="center">0.6207752</td>
<td valign="top" align="center">0.1403694</td>
<td valign="top" align="center">0.3792248</td>
</tr>
<tr>
<td valign="top" align="left">Scale.oversample.classif.log_reg</td>
<td valign="top" align="center">0.8495273</td>
<td valign="top" align="center">0.8218000</td>
<td valign="top" align="center">0.7595176</td>
<td valign="top" align="center">0.7214073</td>
<td valign="top" align="center">0.2404824</td>
<td valign="top" align="center">0.2785927</td>
</tr>
<tr>
<td valign="top" align="left">Scale.oversample.classif.svm</td>
<td valign="top" align="center">0.9466890</td>
<td valign="top" align="center">0.7996170</td>
<td valign="top" align="center">0.7871304</td>
<td valign="top" align="center">0.6672630</td>
<td valign="top" align="center">0.2128696</td>
<td valign="top" align="center">0.3327370</td>
</tr>
<tr>
<td valign="top" align="left">Scale.oversample.classif.xgboost</td>
<td valign="top" align="center">1.0000000</td>
<td valign="top" align="center">0.7943870</td>
<td valign="top" align="center">0.8020730</td>
<td valign="top" align="center">0.6502087</td>
<td valign="top" align="center">0.1979270</td>
<td valign="top" align="center">0.3497913</td>
</tr>
<tr>
<td valign="top" align="left">Scale.oversample.classif.rpart</td>
<td valign="top" align="center">0.7904094</td>
<td valign="top" align="center">0.7518600</td>
<td valign="top" align="center">0.7676433</td>
<td valign="top" align="center">0.6703518</td>
<td valign="top" align="center">0.2323567</td>
<td valign="top" align="center">0.3296482</td>
</tr>
<tr>
<td valign="top" align="left">Scale.oversample.classif.ranger</td>
<td valign="top" align="center">0.9996804</td>
<td valign="top" align="center">0.8163943</td>
<td valign="top" align="center">0.8366222</td>
<td valign="top" align="center">0.6718664</td>
<td valign="top" align="center">0.1633778</td>
<td valign="top" align="center">0.3281336</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="table-fn2"><p>This set of machine learning pipelines (&#x201C;scale.oversample.classif.log_reg&#x201D;, &#x201C;scale.oversample.classif.svm&#x201D;, &#x201C;scale.oversample.classif.xgboost&#x201D;, &#x201C;scale.oversample.classif.rpart&#x201D;, &#x201C;scale.oversample.classif.ranger&#x201D;) corresponds to different classifiers such as logistic regression, support vector machine, XGBoost, recursive partitioning tree (rpart), and Ranger random forest, aimed at accomplishing the final classification task. The ensemble framework is designed to enhance the model&#x0027;s ability to handle imbalanced data, thereby improving the overall performance of the classification algorithm.</p></fn>
</table-wrap-foot>
</table-wrap>
<fig id="F3" position="float"><label>Figure 3</label>
<caption><p>Forest plot showing logistic regression multivariate analysis of CAS.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fcvm-11-1392752-g003.tif"/>
</fig>
<p>Expanding upon our analysis, we extracted the regression model and generated ROC and PRC curves (<xref ref-type="fig" rid="F4">Figures&#x00A0;4A,B</xref>) to further assess the model. We performed consistency checks using the calibrate function and depicted the calibration curve (<xref ref-type="fig" rid="F4">Figure&#x00A0;4C</xref>). Additionally, employing decision curve analysis allowed us to assess patient benefits at different thresholds, providing insights into the model&#x0027;s potential value in real clinical decision-making (<xref ref-type="fig" rid="F4">Figure&#x00A0;4D</xref>). This series of analyses and evaluations contributes to a thorough understanding of the model&#x0027;s performance and applicability.</p>
<fig id="F4" position="float"><label>Figure 4</label>
<caption><p>Model performance for CAS prediction. (<bold>A</bold>) Receiver-operating characteristics (ROC) and (<bold>B</bold>) precision recall curve (PRC) plots for the predictive model (AP2C2S model) for discrimination of patients with carotid atherosclerosis in the multiple community populations. The 95&#x0025; CIs of precision and sensitivity are shown as pink ribbons in the PRC and ROC curves, respectively. (<bold>C</bold>) Calibration curve for the AP2C2S model. The plot shows the agreement between predictions from the model and what was actually observed. (<bold>D</bold>) Decision curve analysis for the AP2C2S model. The net benefit (y-axis) is the net proportion of community populations with CAS who, based on the decision strategy, would correctly be recommended further intervention at the same rate that populations with non-CAS would not be recommended further screening. The threshold probability (x-axis) indicates the range of predicted risk levels above which patients and their physicians might opt for further screening. The gray and black lines (horizontal) represent the scenarios where all or none of the community populations would be prospectively determined by the AP2C2S model, respectively. The red line demonstrates the net benefit of the risk model dependent at the chosen risk threshold. The accompanying thinner lines represent the 95&#x0025; confidence intervals.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fcvm-11-1392752-g004.tif"/>
</fig>
</sec>
<sec id="s3c"><title>Development of a risk scoring tool (AP2C2S)</title>
<p>Firstly, we categorized the variables of the final model as per the methodology section, assigning values to each variable based on the description provided (refer to <xref ref-type="table" rid="T3">Table&#x00A0;3</xref>). Subsequently, utilizing the equation of the multiple logistic regression model, we calculated the risk prediction probability for each corresponding score. Through this iterative process, we established a comprehensive table illustrating the correspondence between total scores and risk prediction probabilities, as depicted in <xref ref-type="table" rid="T4">Table&#x00A0;4</xref>.</p>
<table-wrap id="T3" position="float"><label>Table 3</label>
<caption><p>Development of a risk factor scoring tool using multifactor logistic regression.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Factors</th>
<th valign="top" align="center">Categories</th>
<th valign="top" align="center">Reference value (<italic>Wij</italic>)</th>
<th valign="top" align="center"><italic>&#x03B2;</italic>i</th>
<th valign="top" align="center"><italic>&#x03B2;i</italic> (<italic>Wij&#x2212;WiREF</italic>)</th>
<th valign="top" align="center"><italic>Pointsij&#x2009;&#x003D;&#x2009;D/B&#x2009;&#x003D;&#x2009;(Wij&#x2212;WiREF) &#x002A; &#x03B2;i/B</italic></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" rowspan="6">Age</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center">0.127</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="center">35&#x2013;44</td>
<td valign="top" align="center">39.5&#x2009;&#x003D;&#x2009;W1REF</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="center">45&#x2013;54</td>
<td valign="top" align="center">49.5</td>
<td valign="top" align="center"/>
<td valign="top" align="center">1.27</td>
<td valign="top" align="center">4</td>
</tr>
<tr>
<td valign="top" align="center">55&#x2013;64</td>
<td valign="top" align="center">59.5</td>
<td valign="top" align="center"/>
<td valign="top" align="center">2.54</td>
<td valign="top" align="center">8</td>
</tr>
<tr>
<td valign="top" align="center">65&#x2013;74</td>
<td valign="top" align="center">69.5</td>
<td valign="top" align="center"/>
<td valign="top" align="center">3.81</td>
<td valign="top" align="center">12</td>
</tr>
<tr>
<td valign="top" align="center">&#x2265;75</td>
<td valign="top" align="center">78.5</td>
<td valign="top" align="center"/>
<td valign="top" align="center">4.953</td>
<td valign="top" align="center">15</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="7">SBP</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center">0.022</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="center">&#x003C;120</td>
<td valign="top" align="center">107</td>
<td valign="top" align="center"/>
<td valign="top" align="center">&#x2212;0.396</td>
<td valign="top" align="center">&#x2212;1</td>
</tr>
<tr>
<td valign="top" align="center">120&#x2013;129</td>
<td valign="top" align="center">125&#x2009;&#x003D;&#x2009;W2REF</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="center">130&#x2013;139</td>
<td valign="top" align="center">135</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0.22</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="center">140&#x2013;149</td>
<td valign="top" align="center">145</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0.44</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="center">150&#x2013;159</td>
<td valign="top" align="center">155</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0.66</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="center">&#x2265;160</td>
<td valign="top" align="center">170</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0.99</td>
<td valign="top" align="center">3</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="5">HDL</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center">&#x2212;1.28</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="center">&#x003C;1.14</td>
<td valign="top" align="center">0.99</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0.2944</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="center">1.14&#x2013;1.29</td>
<td valign="top" align="center">1.22&#x2009;&#x003D;&#x2009;W3REF</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="center">1.30&#x2013;1.50</td>
<td valign="top" align="center">1.40</td>
<td valign="top" align="center"/>
<td valign="top" align="center">&#x2212;0.2304</td>
<td valign="top" align="center">&#x2212;1</td>
</tr>
<tr>
<td valign="top" align="center">&#x2265;1.51</td>
<td valign="top" align="center">1.89</td>
<td valign="top" align="center"/>
<td valign="top" align="center">&#x2212;0.8576</td>
<td valign="top" align="center">&#x2212;3</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="5">TC</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center">0.55</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="center">&#x003C;4.70</td>
<td valign="top" align="center">3.98&#x2009;&#x003D;&#x2009;W4REF</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="center">4.70&#x2013;5.33</td>
<td valign="top" align="center">5.02</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0.572</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="center">5.34&#x2013;6.04</td>
<td valign="top" align="center">5.69</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0.9405</td>
<td valign="top" align="center">3</td>
</tr>
<tr>
<td valign="top" align="center">&#x2265;6.05</td>
<td valign="top" align="center">7.23</td>
<td valign="top" align="center"/>
<td valign="top" align="center">1.7875</td>
<td valign="top" align="center">5</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="3">Sex</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center">0.88</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="center">Female</td>
<td valign="top" align="center">0&#x2009;&#x003D;&#x2009;W5REF</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="center">Male</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0.88</td>
<td valign="top" align="center">3</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="3">Hypertension</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center">0.39</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="center">No</td>
<td valign="top" align="center">0&#x2009;&#x003D;&#x2009;W6REF</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="center">Yes</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0.39</td>
<td valign="top" align="center">1</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="table-fn3"><p>HDL, high-density lipoprotein; SBP, systolic blood pressure; TC, total cholesterol.</p></fn>
<fn id="table-fn4"><p>Wij (Reference Value of Risk Factor Group): Represents the reference value of the j-th category of the i-th risk factor group. Typically, the median of this category is selected as the reference value. WiREF (Basic Risk Reference Value): Represents the baseline risk reference value of the i-th risk factor. When constructing the scoring tool, an appropriate group is selected as WiREF, with its score set to 0. Other groups receive positive or negative scores based on their relationship with WiREF. Risk Score Calculation: Utilizes the regression coefficients &#x03B2;i estimated by a multiple logistic regression model and the reference values Wij of each risk factor group to calculate the distance D between each group and the baseline WiREF. The formula is as follows: D&#x2009;&#x003D;&#x2009;(Wij - WiREF) &#x002A; &#x03B2;i. The score for each risk factor (Pointsij) represents the calculation derived from the multiple logistic regression model, indicating the score of the ith risk factor in the jth category. This score is based on the difference between the reference value (Wij) and the baseline risk reference value (WiREF) of that category, multiplied by the regression coefficient (&#x03B2;i) of the risk factor, and divided by a constant (B). This constant, B, is utilized to convert the units of the regression coefficients into scores, ensuring consistency in the use of scores within the risk scoring system.</p></fn>
</table-wrap-foot>
</table-wrap>
<table-wrap id="T4" position="float"><label>Table 4</label>
<caption><p>The correspondence table between total score and risk prediction probability.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="char"/>
<col align="char"/>
<col align="char"/>
<col align="char"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Point total</th>
<th valign="top" align="center">Estimate of risk</th>
<th valign="top" align="center">Point total</th>
<th valign="top" align="center">Estimate of risk</th>
<th valign="top" align="center">Point total</th>
<th valign="top" align="center">Estimate of risk</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">&#x2212;1</td>
<td valign="top" align="center">0.88195759</td>
<td valign="top" align="center">9</td>
<td valign="top" align="center">0.452914929</td>
<td valign="top" align="center">19</td>
<td>0.084023053</td>
</tr>
<tr>
<td valign="top" align="left">0</td>
<td>0.857062087</td>
<td>10</td>
<td>0.39917591</td>
<td>20</td>
<td>0.068567823</td>
</tr>
<tr>
<td valign="top" align="left">1</td>
<td>0.827940365</td>
<td>11</td>
<td>0.347760001</td>
<td>21</td>
<td>0.055782307</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td>0.794309407</td>
<td>12</td>
<td>0.299663659</td>
<td>22</td>
<td>0.045264987</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td>0.756041843</td>
<td>13</td>
<td>0.25561233</td>
<td>23</td>
<td>0.03665365</td>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td>0.713225204</td>
<td>14</td>
<td>0.216039055</td>
<td>24</td>
<td>0.029629715</td>
</tr>
<tr>
<td valign="top" align="left">5</td>
<td>0.666211583</td>
<td>15</td>
<td>0.18110187</td>
<td>25</td>
<td>0.023918357</td>
</tr>
<tr>
<td valign="top" align="left">6</td>
<td>0.615644079</td>
<td>16</td>
<td>0.150728336</td>
<td>26</td>
<td>0.019286027</td>
</tr>
<tr>
<td valign="top" align="left">7</td>
<td>0.56244723</td>
<td>17</td>
<td>0.124673352</td>
<td>27</td>
<td>0.015536572</td>
</tr>
<tr>
<td valign="top" align="left">8</td>
<td>0.507774373</td>
<td>18</td>
<td>0.102578251</td>
<td>28</td>
<td>0.012506764</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The seamless integration of this grouping and calculation procedure facilitates a systematic evaluation of each variable&#x0027;s contribution to the final model. It ensures a thorough and precise prediction of risk probability for patients. This methodical approach underscores the scientific rigor and practical utility of our risk assessment model in a clinical context.</p>
<p>To illustrate the application of the AP2C2S risk scoring tool concretely, we provide an example based on <xref ref-type="table" rid="T3">Tables&#x00A0;3</xref>, <xref ref-type="table" rid="T4">4</xref>. Let&#x0027;s consider a 55-year-old male patient with a systolic blood pressure of 135&#x2005;mmHg, total cholesterol (TC) of 5.5&#x2005;mmol/L, high-density lipoprotein (HDL) of 1.2&#x2005;mmol/L, and a history of hypertension. Referring to <xref ref-type="table" rid="T3">Table&#x00A0;3</xref>, we can assign points for each risk factor: Age (55&#x2013;64 years): 8 points; Gender (male): 3 points; SBP (130&#x2013;139 mmHg): 1 point; HDL (1.14&#x2013;1.29&#x2005;mmol/L): 0 points; TC (reference range): 3 points; Hypertension (yes): 1 point. Adding up these points, the patient&#x0027;s baseline total score is 16 points. Next, referring to <xref ref-type="table" rid="T4">Table&#x00A0;4</xref>, we find the corresponding CAS risk prediction probability based on the total score. In this example, a score of 16 corresponds to a risk prediction probability of 15.07&#x0025;.</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion"><title>Discussion</title>
<p>Our study revealed a 57.4&#x0025; prevalence of CAS among 1515 participants, underscoring a significant risk, especially in the middle-aged and elderly population. CAS patients exhibited higher age and positive correlations with traditional cardiovascular risk factors, including systolic blood pressure, age, history of hypertension, male gender, and total cholesterol. Notably, we identified high-density lipoprotein (HDL) as a protective factor against CAS, highlighting its role in risk mitigation. These findings indicate that total cholesterol and HDL levels could serve as significant predictors of CAS in community-dwelling men. This underscores the importance of managing cholesterol and increasing HDL levels to prevent the development of atherosclerosis. Specifically for elderly men with a history of hypertension, early adoption of secondary cardiovascular prevention measures is strongly recommended. Furthermore, leveraging advanced machine learning techniques, such as SVM, XGBoost, decision trees, random forests, and logistic regression, we achieved high accuracy during training (79&#x0025;&#x2013;100&#x0025;). The logistic classifier, with an 82&#x0025; accuracy, exhibited superior robustness in transitioning from training to testing, leading to its selection as the final model. This comprehensive approach enhances our understanding of CAS while providing a practical tool for risk assessment and personalized preventive strategies.</p>
<p>A traditional belief was that HDL particles, known for their role in reverse cholesterol transport, conferred cardiovascular benefits. However, current insights into HDL highlight its role in suppressing inflammation, oxidative stress, and stimulating endothelial function (<xref ref-type="bibr" rid="B11">11</xref>). Additionally, animal studies have indicated that recombinant HDL may inhibit the expression of carotid VCAM-1 (<xref ref-type="bibr" rid="B12">12</xref>) or aortic VCAM-1 and ICAM-1 (<xref ref-type="bibr" rid="B13">13</xref>). HDL has also been demonstrated to reduce the surface expression of ICAM-1, VCAM-1, and E-selectin by activating annexin A1 (<xref ref-type="bibr" rid="B14">14</xref>), a recognized anti-inflammatory mediator. In summary, the collective evidence from experimental models suggests that HDL particles directly influence endothelial cells, inhibiting proteins associated with endothelial activation. This mechanism holds the potential to decelerate the progression of atherosclerosis.</p>
<p>Notably, this study integrates traditional epidemiological analysis with advanced machine learning techniques, culminating in the creation of a practical risk scoring tool. By initially recruiting a substantial sample and utilizing carotid ultrasound to identify atherosclerosis, the research delves into population characteristics, revealing significant associations with demographic factors. The application of machine learning algorithms enhances the study&#x0027;s predictive capabilities, with logistic regression emerging as the most robust model (<xref ref-type="bibr" rid="B15">15</xref>). The incorporation of ROC and PRC curves, calibration checks, and decision curve analysis ensures a thorough evaluation of the model&#x0027;s performance and clinical utility. Additionally, the development of a risk scoring tool (AP2C2S) based on logistic regression results contributes to a systematic and precise assessment of individual risk probabilities. This holistic methodology reflects a novel and integrated approach to investigating and managing CAS, offering valuable insights for both research and clinical applications.</p>
<p>While our study yields valuable insights, certain limitations need consideration. The cross-sectional nature impedes causal inference, necessitating future longitudinal investigations. Additionally, the study&#x0027;s regional focus may impact generalizability, prompting caution in extending findings to broader populations. It is also worth noting that the AP2C2S model has not undergone direct comparison with the Systematic Coronary Risk Evaluation (SCORE) system (<xref ref-type="bibr" rid="B16">16</xref>) or other currently utilized scoring systems for carotid artery disease risk assessment. Therefore, while our findings provide valuable insights into the risk factors associated with carotid atherosclerosis, further research is needed to compare the AP2C2S model with other scoring systems and to validate its predictive accuracy across different demographic groups.</p>
<p>The risk scoring tool developed in this study serves as a foundation for further refinement and validation in diverse populations. Future research could explore additional biomarkers or imaging modalities to enhance risk prediction accuracy. The study sets the stage for evaluating personalized interventions based on risk scores, contributing to targeted and efficient preventive strategies.</p>
<p>Given the prolonged progression of atherosclerosis, our study&#x0027;s &#x201C;preventive strategies&#x201D; aim to achieve two key objectives: primary prevention for identifying high-risk individuals susceptible to cerebrovascular and cardiovascular complications, and secondary prevention targeting existing CAS patients. For primary prevention, our AP2C2S model facilitates the identification of candidates who could benefit from lifestyle modifications and early medical interventions, thereby reducing the risk of stroke. In the realm of secondary prevention, the same model serves as a valuable tool for prioritizing patients requiring heightened surveillance and more aggressive treatment approaches to impede CAS progression.</p>
</sec>
<sec id="s5" sec-type="conclusions"><title>Conclusions</title>
<p>In conclusion, our study unveils a significant prevalence of CAS within the community, especially among the elderly. The introduction of the AP2C2S risk scoring tool, validated through the logistic classifier&#x0027;s robust performance across training and testing phases, offers a refined approach to risk assessment. This tool holds promise for identifying high-risk individuals within community health initiatives, potentially streamlining the process of screening and clinical intervention. By emphasizing the critical role of cholesterol management, particularly high-density lipoprotein (HDL), our research provides actionable insights that could inform CAS prevention strategies. However, we recognize the imperative for rigorous and extensive validation to ensure the tool&#x0027;s practicality and effectiveness in diverse real-world settings.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability"><title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/Supplementary Material, further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s7" sec-type="ethics-statement"><title>Ethics statement</title>
<p>The studies involving humans were approved by the Ethical Committee of Guangdong Second Provincial General Hospital. The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p>
</sec>
<sec id="s8" sec-type="author-contributions"><title>Author contributions</title>
<p>Z-XH: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft, Supervision, Project administration, Methodology, Funding acquisition, Conceptualization. LC: Writing &#x2013; original draft, Validation, Methodology, Formal Analysis, Data curation. PC: Writing &#x2013; review &#x0026; editing, Methodology, Formal Analysis, Data curation. YD: Writing &#x2013; review &#x0026; editing, Validation, Methodology, Funding acquisition, Data curation. HL: Writing &#x2013; original draft, Visualization, Methodology, Investigation, Data curation. YL: Writing &#x2013; original draft, Methodology, Data curation, Conceptualization. QD: Writing &#x2013; review &#x0026; editing, Visualization, Project administration, Methodology. PL: Writing &#x2013; review &#x0026; editing, Project administration, Methodology.</p>
</sec>
<sec id="s9" sec-type="funding-information"><title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article.</p>
<p>Z-XH was supported by the Science and Technology Program of Guangzhou, China (2024B03J0436), and Research Funds of Centre for Leading Medicine and Advanced Technologies of IHM (No. 2023IHM01052). YD was supported by the Medical Scientific Research Foundation of Guangdong Province, China (B2021382). The funding source had no role in study design, data collection, analysis, or interpretation.</p>
</sec>
<ack><title>Acknowledgments</title>
<p>We thank all the community populations who participated in the study and the health professionals who helped with the data collection.</p>
</ack>
<sec id="s10" sec-type="COI-statement"><title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s11" sec-type="disclaimer"><title>Publisher&#x0027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list><title>References</title>
<ref id="B1"><label>1.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kato</surname><given-names>A</given-names></name><name><surname>Minami</surname><given-names>Y</given-names></name><name><surname>Asakura</surname><given-names>K</given-names></name><name><surname>Katamine</surname><given-names>M</given-names></name><name><surname>Katsura</surname><given-names>A</given-names></name><name><surname>Muramatsu</surname><given-names>Y</given-names></name><etal/></person-group> <article-title>Characteristics of carotid atherosclerosis in patients with plaque erosion</article-title>. <source>J Thromb Thrombolysis</source>. (<year>2021</year>) <volume>52</volume>(<issue>2</issue>):<fpage>620</fpage>&#x2013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1007/s11239-021-02419-1</pub-id><pub-id pub-id-type="pmid">33694096</pub-id></citation></ref>
<ref id="B2"><label>2.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>W</given-names></name><name><surname>Luo</surname><given-names>J</given-names></name><name><surname>Peng</surname><given-names>F</given-names></name><name><surname>Liu</surname><given-names>R</given-names></name><name><surname>Bai</surname><given-names>X</given-names></name><name><surname>Wang</surname><given-names>T</given-names></name><etal/></person-group> <article-title>Spatial metabolomics identifies lipid profiles of human carotid atherosclerosis</article-title>. <source>Atherosclerosis</source>. (<year>2023</year>) <volume>364</volume>:<fpage>20</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1016/j.atherosclerosis.2022.11.019</pub-id><pub-id pub-id-type="pmid">36459728</pub-id></citation></ref>
<ref id="B3"><label>3.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kassem</surname><given-names>M</given-names></name><name><surname>Nies</surname><given-names>KPH</given-names></name><name><surname>Boswijk</surname><given-names>E</given-names></name><name><surname>van der Pol</surname><given-names>J</given-names></name><name><surname>Aizaz</surname><given-names>M</given-names></name><name><surname>Gijbels</surname><given-names>MJJ</given-names></name><etal/></person-group> <article-title>Quantification of carotid plaque composition with a multi-contrast atherosclerosis characterization (match) MRI sequence</article-title>. <source>Front Cardiovasc Med</source>. (<year>2023</year>) <volume>10</volume>:<fpage>1227495</fpage>. <pub-id pub-id-type="doi">10.3389/fcvm.2023.1227495</pub-id><pub-id pub-id-type="pmid">37680565</pub-id></citation></ref>
<ref id="B4"><label>4.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>X</given-names></name><name><surname>Li</surname><given-names>W</given-names></name><name><surname>Song</surname><given-names>F</given-names></name><name><surname>Wang</surname><given-names>L</given-names></name><name><surname>Fu</surname><given-names>Q</given-names></name><name><surname>Cao</surname><given-names>S</given-names></name><etal/></person-group> <article-title>Carotid atherosclerosis detected by ultrasonography: a national cross-sectional study</article-title>. <source>J Am Heart Assoc</source>. (<year>2018</year>) <volume>7</volume>(<issue>8</issue>):<fpage>e008701</fpage>. <pub-id pub-id-type="doi">10.1161/JAHA.118.008701</pub-id><pub-id pub-id-type="pmid">29622590</pub-id></citation></ref>
<ref id="B5"><label>5.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hsiao</surname><given-names>CL</given-names></name><name><surname>Chen</surname><given-names>PY</given-names></name><name><surname>Hsu</surname><given-names>PJ</given-names></name><name><surname>Lin</surname><given-names>SK</given-names></name></person-group>. <article-title>Nomogram and carotid risk score for predicting moderate or high carotid atherosclerosis among asymptomatic elderly recycling volunteers</article-title>. <source>Diagnostics (Basel)</source>. (<year>2022</year>) <volume>12</volume>(<issue>6</issue>):<fpage>1407</fpage>. <pub-id pub-id-type="doi">10.3390/diagnostics12061407</pub-id><pub-id pub-id-type="pmid">35741217</pub-id></citation></ref>
<ref id="B6"><label>6.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fu</surname><given-names>J</given-names></name><name><surname>Deng</surname><given-names>Y</given-names></name><name><surname>Ma</surname><given-names>Y</given-names></name><name><surname>Man</surname><given-names>S</given-names></name><name><surname>Yang</surname><given-names>X</given-names></name><name><surname>Yu</surname><given-names>C</given-names></name><etal/></person-group> <article-title>National and provincial-level prevalence and risk factors of carotid atherosclerosis in Chinese adults</article-title>. <source>JAMA Netw Open</source>. (<year>2024</year>) <volume>7</volume>(<issue>1</issue>):<fpage>e2351225</fpage>. <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.51225</pub-id><pub-id pub-id-type="pmid">38206625</pub-id></citation></ref>
<ref id="B7"><label>7.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname><given-names>G</given-names></name><name><surname>Jin</surname><given-names>Q</given-names></name><name><surname>Tian</surname><given-names>X</given-names></name><name><surname>Mao</surname><given-names>Y</given-names></name></person-group>. <article-title>Development and validation of a carotid atherosclerosis risk prediction model based on a Chinese population</article-title>. <source>Front Cardiovasc Med</source>. (<year>2022</year>) <volume>9</volume>:<fpage>946063</fpage>. <pub-id pub-id-type="doi">10.3389/fcvm.2022.946063</pub-id><pub-id pub-id-type="pmid">35983181</pub-id></citation></ref>
<ref id="B8"><label>8.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shimizu</surname><given-names>Y</given-names></name><name><surname>Yamanashi</surname><given-names>H</given-names></name><name><surname>Honda</surname><given-names>Y</given-names></name><name><surname>Nonaka</surname><given-names>F</given-names></name><name><surname>Miyata</surname><given-names>J</given-names></name><name><surname>Kawashiri</surname><given-names>SY</given-names></name><etal/></person-group> <article-title>Low-density lipoprotein cholesterol, structural atherosclerosis, and functional atherosclerosis in older Japanese</article-title>. <source>Nutrients</source>. (<year>2022</year>) <volume>15</volume>(<issue>1</issue>):<fpage>183</fpage>. <pub-id pub-id-type="doi">10.3390/nu15010183</pub-id><pub-id pub-id-type="pmid">36615839</pub-id></citation></ref>
<ref id="B9"><label>9.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zeng</surname><given-names>N</given-names></name><name><surname>Shen</surname><given-names>Y</given-names></name><name><surname>Li</surname><given-names>Y</given-names></name><name><surname>Wang</surname><given-names>Y</given-names></name></person-group>. <article-title>Association between remnant cholesterol and subclinical carotid atherosclerosis among Chinese general population in health examination</article-title>. <source>J Stroke Cerebrovasc Dis</source>. (<year>2023</year>) <volume>32</volume>(<issue>8</issue>):<fpage>107234</fpage>. <pub-id pub-id-type="doi">10.1016/j.jstrokecerebrovasdis.2023.107234</pub-id><pub-id pub-id-type="pmid">37392486</pub-id></citation></ref>
<ref id="B10"><label>10.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname><given-names>ZX</given-names></name><name><surname>Chen</surname><given-names>LH</given-names></name><name><surname>Xiong</surname><given-names>R</given-names></name><name><surname>He</surname><given-names>YN</given-names></name><name><surname>Zhang</surname><given-names>Z</given-names></name><name><surname>Zeng</surname><given-names>J</given-names></name><etal/></person-group> <article-title>Essen stroke risk score predicts carotid atherosclerosis in Chinese community populations</article-title>. <source>Risk Manag Healthc Policy</source>. (<year>2020</year>) <volume>13</volume>:<fpage>2115</fpage>&#x2013;<lpage>23</lpage>. <pub-id pub-id-type="doi">10.2147/RMHP.S274340</pub-id><pub-id pub-id-type="pmid">33116991</pub-id></citation></ref>
<ref id="B11"><label>11.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hung</surname><given-names>AM</given-names></name><name><surname>Tsuchida</surname><given-names>Y</given-names></name><name><surname>Nowak</surname><given-names>KL</given-names></name><name><surname>Sarkar</surname><given-names>S</given-names></name><name><surname>Chonchol</surname><given-names>M</given-names></name><name><surname>Whitfield</surname><given-names>V</given-names></name><etal/></person-group> <article-title>Il-1 inhibition and function of the HDL-containing fraction of plasma in patients with stages 3 to 5 CKD</article-title>. <source>Clin J Am Soc Nephrol</source>. (<year>2019</year>) <volume>14</volume>(<issue>5</issue>):<fpage>702</fpage>&#x2013;<lpage>11</lpage>. <pub-id pub-id-type="doi">10.2215/CJN.04360418</pub-id><pub-id pub-id-type="pmid">31015261</pub-id></citation></ref>
<ref id="B12"><label>12.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shearston</surname><given-names>K</given-names></name><name><surname>Tan</surname><given-names>JTM</given-names></name><name><surname>Cochran</surname><given-names>BJ</given-names></name><name><surname>Rye</surname><given-names>KA</given-names></name></person-group>. <article-title>Inhibition of vascular inflammation by apolipoprotein A-IV</article-title>. <source>Front Cardiovasc Med</source>. (<year>2022</year>) <volume>9</volume>:<fpage>901408</fpage>. <pub-id pub-id-type="doi">10.3389/fcvm.2022.901408</pub-id><pub-id pub-id-type="pmid">35845068</pub-id></citation></ref>
<ref id="B13"><label>13.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname><given-names>C</given-names></name><name><surname>Chang</surname><given-names>CC</given-names></name><name><surname>Lee</surname><given-names>IT</given-names></name><name><surname>Huang</surname><given-names>CY</given-names></name><name><surname>Lin</surname><given-names>FY</given-names></name><name><surname>Lin</surname><given-names>SJ</given-names></name><etal/></person-group> <article-title>High-density lipoprotein protects vascular endothelial cells from indoxyl sulfate insults through its antioxidant ability</article-title>. <source>Cell Cycle</source>. (<year>2023</year>) <volume>22</volume>(<issue>21&#x2013;22</issue>):<fpage>2409</fpage>&#x2013;<lpage>23</lpage>. <pub-id pub-id-type="doi">10.1080/15384101.2023.2296184</pub-id><pub-id pub-id-type="pmid">38129288</pub-id></citation></ref>
<ref id="B14"><label>14.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pan</surname><given-names>B</given-names></name><name><surname>Kong</surname><given-names>J</given-names></name><name><surname>Jin</surname><given-names>J</given-names></name><name><surname>Kong</surname><given-names>J</given-names></name><name><surname>He</surname><given-names>Y</given-names></name><name><surname>Dong</surname><given-names>S</given-names></name><etal/></person-group> <article-title>A novel anti-inflammatory mechanism of high density lipoprotein through up-regulating annexin A1 in vascular endothelial cells</article-title>. <source>Biochim Biophys Acta</source>. (<year>2016</year>) <volume>1861</volume>(<issue>6</issue>):<fpage>501</fpage>&#x2013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbalip.2016.03.022</pub-id><pub-id pub-id-type="pmid">27012521</pub-id></citation></ref>
<ref id="B15"><label>15.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Goecks</surname><given-names>J</given-names></name><name><surname>Jalili</surname><given-names>V</given-names></name><name><surname>Heiser</surname><given-names>LM</given-names></name><name><surname>Gray</surname><given-names>JW</given-names></name></person-group>. <article-title>How machine learning will transform biomedicine</article-title>. <source>Cell</source>. (<year>2020</year>) <volume>181</volume>(<issue>1</issue>):<fpage>92</fpage>&#x2013;<lpage>101</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2020.03.022</pub-id><pub-id pub-id-type="pmid">32243801</pub-id></citation></ref>
<ref id="B16"><label>16.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Conroy</surname><given-names>RM</given-names></name><name><surname>Pyorala</surname><given-names>K</given-names></name><name><surname>Fitzgerald</surname><given-names>AP</given-names></name><name><surname>Sans</surname><given-names>S</given-names></name><name><surname>Menotti</surname><given-names>A</given-names></name><name><surname>De Backer</surname><given-names>G</given-names></name><etal/></person-group> <article-title>Estimation of ten-year risk of fatal cardiovascular disease in Europe: the score project</article-title>. <source>Eur Heart J</source>. (<year>2003</year>) <volume>24</volume>(<issue>11</issue>):<fpage>987</fpage>&#x2013;<lpage>1003</lpage>. <pub-id pub-id-type="doi">10.1016/s0195-668x(03)00114-3</pub-id><pub-id pub-id-type="pmid">12788299</pub-id></citation></ref></ref-list>
</back>
</article>