<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Endocrinol.</journal-id>
<journal-title>Frontiers in Endocrinology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Endocrinol.</abbrev-journal-title>
<issn pub-type="epub">1664-2392</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fendo.2025.1655828</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Endocrinology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Prediction of malignancy risk in Bethesda III nodules: development and validation of multiple machine learning models</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Wentian</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3115971/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhu</surname>
<given-names>Jiayu</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Ying</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3183082/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Jingxiu</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Zhonghui</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Cuicui</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Xue</surname>
<given-names>Jingli</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zhou</surname>
<given-names>Peng</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2083735/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>He</surname>
<given-names>Qingqing</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1914377/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Shandong First Medical University (Shandong Academy of Medical Sciences)</institution>, <addr-line>Jinan, Shandong</addr-line>,&#xa0;<country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Thyroid &amp; Breast Surgery, The 960th Hospital of the PLA Joint Logistics Support Force</institution>, <addr-line>Jinan</addr-line>,&#xa0;<country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Shandong University of Traditional Chinese Medicine</institution>, <addr-line>Jinan, Shandong</addr-line>,&#xa0;<country>China</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Department of Pathology, The 960th Hospital of the PLA Joint Logistics Support Force</institution>, <addr-line>Jinan</addr-line>,&#xa0;<country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2973224/overview">Lisa Jia Tran</ext-link>, Ludwig Maximilian University of Munich, Germany</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1885408/overview">Jincao Yao</ext-link>, University of Chinese Academy of Sciences, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1474805/overview">Shahram Taeb</ext-link>, Gilan University of Medical Sciences, Iran</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3155015/overview">Ricardo V. Garcia-Mayor</ext-link>, Instituto de Investigaci&#xf3;n Sanitaria Galicia Sur (IISGS), Spain</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Qingqing He, <email xlink:href="mailto:heqingqing@yeah.net">heqingqing@yeah.net</email>; Peng Zhou, <email xlink:href="mailto:weardzp@126.com">weardzp@126.com</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>29</day>
<month>08</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1655828</elocation-id>
<history>
<date date-type="received">
<day>28</day>
<month>06</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>18</day>
<month>08</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Li, Zhu, Wang, Li, Li, Wang, Xue, Zhou and He</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Li, Zhu, Wang, Li, Li, Wang, Xue, Zhou and He</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Objective</title>
<p>To develop and validate a machine learning (ML)-based prediction model of Bethesda III nodules and create a nomogram based on the best model.</p>
</sec>
<sec>
<title>Methods</title>
<p>We collected data on patients with Bethesda III nodules who were admitted between January 2020 and June 2024, including 276 Bethesda III nodules from 7371 patients who underwent ultrasound-guided fine needle aspiration (US-FNA). Clinical, ultrasonographic, cytological, laboratory, and molecular data were collected and randomly split into training and validation cohorts at a ratio of 7: 3. Six feature selection methods and ML algorithms&#x2014;Logistic Regression (LR), Decision Tree (DT), Random Forest (RF), Extreme Gradient Boosting (XGB), Support Vector Machine (SVM), and K-Nearest Neighbors (KNN)&#x2014;were evaluated. A nomogram was then created based on the best-performing model.</p>
</sec>
<sec>
<title>Results</title>
<p>The study cohort included 276 Bethesda III nodules with a final malignancy rate of 65.2% (180/276). LR exhibited the highest area under the receiver operating characteristic (ROC) curve (AUC: 0.823) in cross-validation of the validation set. Additionally, the calibration curves and Decision Curve Analysis (DCA) results were also favorable. The model included BRAF, composition, shape, orientation, and the thyroid imaging reporting and data system (TI-RADS). The nomogram exhibited robust discrimination (AUC: 0.846 in the validation set), calibration, and clinical applicability across the two datasets after 500 bootstraps.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>Among the six ML algorithms, the LR algorithm demonstrated the best performance. A nomogram was developed to predict the malignancy risk in Bethesda III nodules. This nomogram may serve as a valuable tool to reduce diagnostic uncertainty and provide personalized risk stratification for patients.</p>
</sec>
</abstract>
<kwd-group>
<kwd>thyroid nodules</kwd>
<kwd>risk of malignancy</kwd>
<kwd>atypia of undetermined significance</kwd>
<kwd>machine learning</kwd>
<kwd>prediction model</kwd>
</kwd-group>
<counts>
<fig-count count="4"/>
<table-count count="3"/>
<equation-count count="0"/>
<ref-count count="59"/>
<page-count count="17"/>
<word-count count="8553"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Thyroid Endocrinology</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Thyroid nodules affect approximately 25% of the general population, making them a prevalent clinical condition. The widespread use of high-resolution ultrasound has significantly increased the detection rate of thyroid nodules, with 65% of individuals identified with nodules during ultrasound examinations (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B2">2</xref>). Although most of these nodules are benign, it remains critical to accurately distinguish malignant lesions to avoid overtreatment and ensure timely intervention. The Bethesda System for Reporting Thyroid Cytopathology (TBSRTC) categorizes fine needle aspiration results into six classifications: (I) non-diagnostic; (II) benign; (III) atypia of undetermined significance (AUS); (IV) follicular neoplasm; (V) suspicious for malignancy; and (VI) malignant. Bethesda III nodules present consistent diagnostic challenges among these categories (<xref ref-type="bibr" rid="B3">3</xref>). The frequency of Bethesda III nodules diagnoses varies significantly across laboratories, ranging from 8.6% to 25.3%. While the Bethesda system estimates the malignancy risk for Bethesda III nodules to range from 13% to 30%, clinical data suggest that the actual malignancy rate may be higher, between 23.5% and 40% (<xref ref-type="bibr" rid="B4">4</xref>&#x2013;<xref ref-type="bibr" rid="B7">7</xref>). The complexity and uncertainty of Bethesda III nodules underscore the urgent need for comprehensive studies to identify preoperative predictors for these nodules.</p>
<p>Preoperative prediction of the benign or malignant nature of Bethesda III nodules necessitates a comprehensive evaluation that incorporates ultrasound features, molecular testing, thyroid function assessments, and demographic factors such as age and gender. While these factors provide some predictive value for the malignancy of Bethesda III nodules, they each have inherent limitations. For example, the BRAF gene is a highly specific biomarker for papillary thyroid carcinoma (PTC), with a malignancy risk of 98.9% to 100%. However, its mutation rate is only 35% to 77% (<xref ref-type="bibr" rid="B8">8</xref>&#x2013;<xref ref-type="bibr" rid="B10">10</xref>), and malignancy is particularly difficult to exclude in follicular subtype Bethesda III nodules when assessed in isolation (<xref ref-type="bibr" rid="B11">11</xref>). Molecular testing using a 12-gene panel can improve the diagnostic accuracy of Bethesda III nodules by detecting key mutations such as BRAF, TERT promoter, NRAS/HRAS/KRAS, PIK3CA, AKT1, RET fusions, NTRK fusions, and PAX8-PPAR&#x3b3;. Bethesda III nodules with negative genetic mutations from this panel exhibit a 6% malignancy risk, with less than a 1% risk of cancer spreading beyond the thyroid (<xref ref-type="bibr" rid="B12">12</xref>, <xref ref-type="bibr" rid="B13">13</xref>). However, the high cost of the 12-gene panel limits its broader application in China. Thus, a combined approach integrating demographic, imaging, and molecular data may enhance diagnostic accuracy. To our knowledge, there are still few studies specifically addressing the prediction of malignancy risk in Bethesda III nodules (<xref ref-type="bibr" rid="B14">14</xref>&#x2013;<xref ref-type="bibr" rid="B16">16</xref>).</p>
<p>Machine learning is the scientific study of algorithms and statistical models that enable computers to perform specific tasks without explicit programming, offering notable advantages in the field of thyroid surgery (<xref ref-type="bibr" rid="B17">17</xref>). Emerging evidence suggests multimodal GPTs may improve diagnostic accuracy through integrated data analysis (<xref ref-type="bibr" rid="B18">18</xref>&#x2013;<xref ref-type="bibr" rid="B20">20</xref>). Radiomics has recently demonstrated effectiveness in automating thyroid nodule classification and risk stratification (<xref ref-type="bibr" rid="B16">16</xref>). Compared to traditional logistic regression models, ML excels in handling complex clinical data, facilitating the development of predictive tools that, in specific cases, outperform conventional statistical models (<xref ref-type="bibr" rid="B21">21</xref>). Although AI research in thyroidology continues to advance, there is limited exploration focused on the most clinically challenging Bethesda III nodules. Recent studies have nevertheless achieved promising results in predicting malignancy for these nodules using machine learning. Cao et&#xa0;al. (<xref ref-type="bibr" rid="B14">14</xref>) developed a nomogram with 0.80 AUC by comparing machine learning methods to logistic regression, whereas Zhong et&#xa0;al. (<xref ref-type="bibr" rid="B16">16</xref>) reported 0.823 AUC but with narrower applicability. Our study employs machine learning algorithms to integrate multidimensional data, including ultrasound features, clinical parameters, and molecular biomarkers, to develop a personalized malignancy risk prediction model for Bethesda III nodules. Through systematic comparison of advanced algorithms with LR, we aim to develop a visual decision support tool that reduces diagnostic uncertainty, prevents unnecessary surgeries, and provides personalized risk stratification for patients.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Study cohort</title>
<p>This retrospective observational study was approved by the 960th Hospital of the PLA Joint Logistics Support Force Research Ethics Committee (No. 2024-171). Research participants were performed in accordance with the Declaration of Helsinki, and each patient provided written informed consent. All eligible patients were informed about the use of their data for study and had the option to decline to participate (<xref ref-type="bibr" rid="B22">22</xref>).</p>
<p>This study included patients with thyroid nodules diagnosed as Bethesda III nodules based on initial FNA between January 2020 and June 2024. Final diagnoses were confirmed through repeat biopsies, 12-gene testing, or surgery (<xref ref-type="bibr" rid="B23">23</xref>). Inclusion criteria included: (1) thyroid nodules classified as Bethesda III on FNA cytology; (2) preoperative ultrasound, molecular testing, and thyroid function tests; (3) patients underwent thyroidectomy; (4) at least one repeat FNA on the same Bethesda III nodule within one year; (5) 12-gene panel testing. Exclusion criteria included: (1) other thyroid cancer types, such as follicular carcinoma or medullary thyroid carcinoma; (2) patients lacking laboratory, imaging, or pathological data; (3) uncertain repeat FNA results; (4) any mutations detected in the 12-gene test; (5) patients without at least six months of follow-up after repeat FNA or 12-gene testing. Patients were randomly assigned to a training set and a validation set in a 7:3 ratio. The training set was used to develop models with various machine learning algorithms, and the validation set was used to evaluate model performance.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Clinical features and data collection</title>
<p>Data for the variables assessed in this study were collected from patients&#x2019; hospitalization electronic medical records (EMRs), including basic patient information, thyroid imaging reporting and data system, cytological assessments, molecular testing following US-FNA, laboratory indicators (within one month before surgery) and postoperative pathological data. Basic patient information included age and sex. Ultrasound features of thyroid nodules were analyzed using TI-RADS terminology, including size, composition, echogenicity, margin, shape, echogenic foci, halo, orientation, location, color Doppler flow imaging (CDFI) pattern, echotexture, posterior features, cervical lymph nodes and solitary nodule (<xref ref-type="bibr" rid="B24">24</xref>). The largest transverse, anteroposterior, and vertical diameters of all nodules were recorded, with the largest of these three measurements used to assess nodule size. Additional features of the nodule were recorded according to C-TIRADS. C-TIRADS classified the nodules by assigning points for composition, echogenicity, shape, margin, and echogenic foci to determine the TIRADS level. Cervical lymph nodes were considered abnormal if they exhibited any of the following features: (a) loss of central hilar echo, (b) cystic change, (c) calcification, (d) cortical hyperechogenicity, (e) increased and irregular vascularity, or (f) cervical lymphadenopathy. Two radiologists reviewed and documented all sonographic characteristics of the thyroid nodules. Disagreements were resolved through discussion or consultation with a third radiologist. In cytological assessments and molecular testing, cytologists examined the cells and cellular structures according to the second edition of the Bethesda System for Reporting Thyroid Cytopathology (<xref ref-type="bibr" rid="B3">3</xref>). Bethesda III cases were reviewed and categorized into the following subtypes: (1) AUS-nuclear atypia: Includes focal nuclear atypia or mild but extensive nuclear atypia; (2) AUS-other: Includes architectural atypia (often sparsely cellular samples predominantly composed of microfollicles) and Hurthle cell atypia (oncocytic features). Two molecular tests were available at our institution: BRAF and a twelve-gene molecular panel. Patients underwent twelve-gene panel testing, which included BRAF, RAS (NRAS, HRAS, KRAS), PIK3CA, AKT1, RET, CCDC6-RET, NCOA4-RET, TP53, ETV6-NTRK3, TPM3-NTRK1, TERT, and PAX8-PPARG promoters. Laboratory indicators obtained included thyroid stimulating hormone (TSH), free thyroxine (FT4), free triiodothyronine (FT3), thyroglobulin antibody (TgAb), thyroid peroxidase antibody (TPOAb), and thyroglobulin (Tg) levels. All predictive factors were derived from objective data and image archiving in the EMRs.</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Assessment of study outcomes</title>
<p>The definitive diagnosis of malignant tumors was confirmed through histopathological analysis of surgically excised tissue or repeated fine-needle aspiration biopsies with malignant results (Bethesda categories V or VI). In contrast, benign nodules were diagnosed based on one of the following criteria: (1) histopathological confirmation from surgically excised specimens, (2) absence of mutations in a 12-gene panel, or (3) at least one benign FNA result (Bethesda II) from repeated biopsies, with no subsequent malignant findings. All patients who did not undergo surgical intervention were followed up with ultrasonography for at least six months to assess any suspicious changes in the nodules. Histopathological results were independently reviewed by two experienced pathologists, and any discrepancies were resolved through consultation with a third pathologist.</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Sample size calculation</title>
<p>We calculated the required sample size using the events per variable (EPV) metric, a widely recognized method in statistical analysis (<xref ref-type="bibr" rid="B25">25</xref>&#x2013;<xref ref-type="bibr" rid="B27">27</xref>). We also followed the 4-step procedure proposed by Riley et&#xa0;al. (<xref ref-type="bibr" rid="B28">28</xref>) to calculate the required sample size (<xref ref-type="bibr" rid="B29">29</xref>). According to guidelines, the malignancy rate of Bethesda III nodules typically ranges from 13% to 30% based on follow-up of surgically resected nodules (<xref ref-type="bibr" rid="B3">3</xref>). Since we intended to include patients who had not undergone surgery, the expected proportion of the endpoint event was estimated at 0.15. The calculation process, formulas, and results are shown in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S2</bold>
</xref>.</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Data preprocessing</title>
<p>Statistical analyses were conducted using SPSS 25.0 software and R (version 4.4.2; R Foundation, Vienna, Austria), with a significance level set at p &lt; 0.05. The &#x201c;mice&#x201d; package in R was used to assess the missing data mechanism, and the VIM package was used for data visualization. Multiple imputation was used to handle missing data, with 10 imputations performed based on the established MAR mechanism, as recommended by standard guidelines. The Multiple Imputation by Chained Equations (MICE) method was used for imputation, implemented through the &#x201c;mice&#x201d; package in R. The imputation model with the lowest Bayesian Information Criterion (BIC) was chosen for data optimization. Continuous variables were imputed using predictive mean matching, categorical variables using logistic regression, and multinomial variables using multinomial logistic regression. All relevant covariates, including predictors, outcome variables, and other variables not included in the predictive model, were incorporated into the imputation model to capture the relationships among the variables.</p>
</sec>
<sec id="s2_6">
<label>2.6</label>
<title>Selection of variables</title>
<p>
<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S1</bold>
</xref> presents the complete study flowchart. Before constructing the predictive model, six feature selection methods were applied to mitigate the high correlation between predictor variables and improve both the predictive accuracy and interpretability of the model. These methods were chosen based on their proven effectiveness in handling high-dimensional data and identifying the most relevant predictor variables in predictive modeling. In clinical prediction models, the combined use of multiple variable selection methods can compensate for the limitations of individual approaches, thereby enhancing the stability of variable selection and the predictive performance of the model (<xref ref-type="bibr" rid="B30">30</xref>, <xref ref-type="bibr" rid="B31">31</xref>). The feature selection methods used include:</p>
<list list-type="order">
<list-item>
<p>Stepwise Regression (SR): This method uses a stepwise selection mechanism to dynamically adjust explanatory variables in the model based on hypothesis testing results, effectively extracting core influencing factors while alleviating collinearity issues. We implemented three variations of stepwise regression: forward selection (FS), backward selection (BS), and bidirectional elimination (BE).</p>
</list-item>
<list-item>
<p>Least Absolute Shrinkage and Selection Operator (LASSO): This method performs variable selection and regularization by adding an L1 penalty to the regression coefficients. It is particularly effective for high-dimensional data, especially when dealing with small sample sizes and high multicollinearity between predictor variables (<xref ref-type="bibr" rid="B32">32</xref>).</p>
</list-item>
<list-item>
<p>Boruta: Built upon the random forest framework, this algorithm constructs a feature evaluation mechanism by comparing the dynamic importance between original variables and shadow variables, using two-tailed statistical validation to achieve precise separation of feature signals and ensuring the retention of all relevant features.</p>
</list-item>
<list-item>
<p>Random Forest-Recursive Feature Elimination (RF-RFE): This method uses an iterative elimination strategy to optimize feature subsets, ensuring their relevance to the classifier and thereby improving model performance.</p>
</list-item>
</list>
<p>We summarized 29 candidate predictors selected through various filtering methods and took their intersection. Finally, we consulted with clinical experts and combined them with clinical reality to determine the final predictors for constructing Bethesda III nodules malignancy prediction model.</p>
</sec>
<sec id="s2_7">
<label>2.7</label>
<title>Model development and performance comparison</title>
<p>Six machine learning models were used to predict the malignancy of Bethesda III nodules: LR (glm stats package), DT (rpart package), RF (randomForest package), XGB (xgboost package), SVM (e1071 package), and KNN (kknn package). The selected clinical features were fed into the six models using various machine learning algorithms. To evaluate the models&#x2019; performance on unseen data, five-fold cross-validation was applied to obtain the parameters. Performance metrics from the confusion matrix were used to assess model efficacy in both the training and validation cohorts, including the Receiver Operating Characteristic curve, sensitivity (SEN), specificity (SPE), positive predictive value (PPV), negative predictive value (NPV), accuracy (ACC), F1 score, and Brier score. A calibration curve was used to compare predicted probabilities with actual outcomes. Decision Curve Analysis was used to evaluate the net benefit of the models at various thresholds. Additionally, the DeLong test was used to determine whether significant differences existed in the AUC values of the models. Based on the evaluation of these metrics in both the training and testing sets, the optimal model was selected.</p>
</sec>
<sec id="s2_8">
<label>2.8</label>
<title>Model explanation</title>
<p>LR was selected as the optimal model based on its performance. The model&#x2019;s performance was demonstrated using 500 bootstrap samples, including the ROC curve, calibration curve, and DCA results. To assess model interpretability and evaluation, we calculated the AUC to evaluate the model&#x2019;s discriminative ability and examined its calibration using the Hosmer-Lemeshow (HL) test. DCA was used to evaluate the net benefit at different thresholds, providing a comprehensive assessment of the model&#x2019;s effectiveness in real-world medical decision-making scenarios. Bootstrapping, a statistical method, was applied to estimate model accuracy by repeatedly sampling with replacement from the original dataset. The model was trained on these new datasets and evaluated using out-of-bag data. This process was repeated several times to obtain a distribution of performance metrics, yielding a robust estimate of model reliability and variance. The nomogram score is the sum of the scores assigned to each risk factor, where higher scores indicate a greater risk of Bethesda III nodules malignancy. This graphical tool simplifies the estimation of individual risk or probability based on the variables predicted by the model.</p>
</sec>
<sec id="s2_9">
<label>2.9</label>
<title>Statistical analysis</title>
<p>All analyses were conducted in R. For continuous variables, the Shapiro-Wilk test was used to assess their normality. This test was selected because it generally performs better than other tests, such as the Kolmogorov-Smirnov test, particularly with small sample sizes. Variables following a normal distribution were described using the mean &#xb1; standard deviation, while non-normally distributed variables were described using the median and interquartile range, providing more robust measures of central tendency and variability in the presence of outliers. Frequency and percentage were reported for categorical variables. To assess collinearity between variables, the variance inflation factor (VIF) was calculated. A VIF value below 5 and tolerance greater than 0.1 typically indicate no significant collinearity between variables. This metric helps ensure that our regression models are not unduly affected by multicollinearity, which can distort the estimated relationships between predictors and outcomes. Fisher&#x2019;s exact test was used for categorical variables with low expected frequencies to ensure accurate significance testing. This test provides a precise method for determining the likelihood of observing a given set of frequencies in categorical variables, particularly useful with small sample sizes. Several R packages were used for specific analyses: comparegroups for baseline description, glmnet for LASSO regression, forestmodel for forest plots, pROC, ggROC, and fbroc for discriminative analysis, PRROC for PR curves, rms for calibration using val.prob and calibrate functions, ResourceSelection for the Hosmer-Lemeshow test, dcurves for DCA, and rms for nomogram construction.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Result</title>
<sec id="s3_1">
<label>3.1</label>
<title>Study cohort and baseline information</title>
<p>Between January 2020 and June 2024, 7,371 patients underwent ultrasound-guided fine needle aspiration, while 2,761 patients underwent thyroidectomy. Among the thyroid nodules assessed by US-FNA, 10.2% (754/7,398) were diagnosed with Bethesda III nodules. Of these Bethesda III nodules, 31.6% (238/754) underwent surgical resection, 7.3% (55/754) underwent repeat biopsies, and 6.9% (52/754) were subjected to 12-gene panel testing. Notably, 36.4% (20/55) of the Bethesda III nodules that underwent repeat biopsies had indeterminate results. A total of 69 patients were excluded due to incomplete records (<xref ref-type="bibr" rid="B16">16</xref>), other pathologically confirmed thyroid cancer types (<xref ref-type="bibr" rid="B2">2</xref>), uncertain repeat biopsy outcomes (<xref ref-type="bibr" rid="B20">20</xref>), mutations found by 12-gene panel testing (<xref ref-type="bibr" rid="B1">1</xref>), or insufficient follow-up for at least six months after repeat biopsy or 12-gene panel testing (<xref ref-type="bibr" rid="B30">30</xref>). Consequently, the current study included 271 patients: 213 females and 58 males, with a total of 276 Bethesda III nodules. Approximately 65.2% (180/276) of the nodules were malignant, while 34.8% (96/276) were benign. BRAF mutations were detected in 41% (113/276) of the cases. In our dataset, only 36 cases (13.04%) were classified as AUS and 25 (9.06%) as FLUS. Neither AUS nor FLUS showed statistical significance in the univariate analysis. The median age of patients was 51 years (IQR 41.00&#x2013;57.25), and the median nodule size was 5.2&#xa0;mm (IQR 4.00&#x2013;7.70). In the current dataset, five variables were missing, all related to thyroid function tests, resulting in 232 missing values, or approximately 2.8% of the total data points. These missing values were distributed among multiple variables, as detailed in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref> and <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S2</bold>
</xref>. The cohort was randomly divided into a training set (n = 193) and a validation set (n = 83). As shown in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>, no significant differences were observed in the baseline characteristics between the two groups (P &gt; 0.05).</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Baseline characteristics of all patients between the training and validation cohorts.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Characteristics</th>
<th valign="middle" align="center">Total N=276</th>
<th valign="middle" align="center">Training N=193</th>
<th valign="middle" align="center">Testing N=83</th>
<th valign="middle" align="center">P value</th>
</tr>
</thead>
<tbody>
<tr>
<th valign="middle" align="left">Gender (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.271</th>
</tr>
<tr>
<td valign="middle" align="left">Male</td>
<td valign="middle" align="center">60 (21.74)</td>
<td valign="middle" align="center">38 (19.69)</td>
<td valign="middle" align="center">22 (26.51)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Female</td>
<td valign="middle" align="center">216 (78.26)</td>
<td valign="middle" align="center">155 (80.31)</td>
<td valign="middle" align="center">61 (73.49)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Age (median [IQR])</td>
<td valign="middle" align="center">51.00[41.00;57.25]</td>
<td valign="middle" align="center">51.00[41.00;58.00]</td>
<td valign="middle" align="center">50.00 [36.00;56.50]</td>
<td valign="middle" align="center">0.245</td>
</tr>
<tr>
<th valign="middle" align="left">Nuclear atypia (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.195</th>
</tr>
<tr>
<td valign="middle" align="left">Present</td>
<td valign="middle" align="center">36 (13.04)</td>
<td valign="middle" align="center">29 (15.03)</td>
<td valign="middle" align="center">7 (8.43)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Absent</td>
<td valign="middle" align="center">240 (86.96)</td>
<td valign="middle" align="center">164 (84.97)</td>
<td valign="middle" align="center">76 (91.57)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Architectural atypia (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.356</th>
</tr>
<tr>
<td valign="middle" align="left">Present</td>
<td valign="middle" align="center">25 (9.06)</td>
<td valign="middle" align="center">20 (10.36)</td>
<td valign="middle" align="center">5 (6.02)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Absent</td>
<td valign="middle" align="center">251 (90.94)</td>
<td valign="middle" align="center">173 (89.64)</td>
<td valign="middle" align="center">78 (93.98)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">BRAF<sup>V600E</sup> (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">1.000</th>
</tr>
<tr>
<td valign="middle" align="left">Positive</td>
<td valign="middle" align="center">113 (40.94)</td>
<td valign="middle" align="center">79 (40.93)</td>
<td valign="middle" align="center">34 (40.96)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Negative</td>
<td valign="middle" align="center">163 (59.06)</td>
<td valign="middle" align="center">114 (59.07)</td>
<td valign="middle" align="center">49 (59.04)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Diameter (median [IQR])</td>
<td valign="middle" align="center">5.20 [4.00;7.70]</td>
<td valign="middle" align="center">5.30 [4.00;8.10]</td>
<td valign="middle" align="center">5.00 [4.00;7.00]</td>
<td valign="middle" align="center">0.513</td>
</tr>
<tr>
<th valign="middle" align="left">Solid composition (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.188</th>
</tr>
<tr>
<td valign="middle" align="left">Yes</td>
<td valign="middle" align="center">236 (85.51)</td>
<td valign="middle" align="center">161 (83.42)</td>
<td valign="middle" align="center">75 (90.36)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">No</td>
<td valign="middle" align="center">40 (14.49)</td>
<td valign="middle" align="center">32 (16.58)</td>
<td valign="middle" align="center">8 (9.64)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Nodule position 1(%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.227</th>
</tr>
<tr>
<td valign="middle" align="left">Left lobe</td>
<td valign="middle" align="center">134 (48.55)</td>
<td valign="middle" align="center">98 (50.78)</td>
<td valign="middle" align="center">36(43.37)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Right lobe</td>
<td valign="middle" align="center">133 (48.19)</td>
<td valign="middle" align="center">88 (45.60)</td>
<td valign="middle" align="center">45 (54.22)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Isthmus</td>
<td valign="middle" align="center">9 (3.26)</td>
<td valign="middle" align="center">7 (3.63)</td>
<td valign="middle" align="center">2 (2.41)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Marked Hypoechoic(%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.687</th>
</tr>
<tr>
<td valign="middle" align="left">Yes</td>
<td valign="middle" align="center">21 (7.61)</td>
<td valign="middle" align="center">16 (8.29)</td>
<td valign="middle" align="center">5 (6.02)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">No</td>
<td valign="middle" align="center">255 (92.39)</td>
<td valign="middle" align="center">177 (91.71)</td>
<td valign="middle" align="center">78 (93.98)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Unclear boundary (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">1.000</th>
</tr>
<tr>
<td valign="middle" align="left">Yes</td>
<td valign="middle" align="center">227 (82.25)</td>
<td valign="middle" align="center">159 (82.38)</td>
<td valign="middle" align="center">68 (81.93)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">No</td>
<td valign="middle" align="center">49 (17.75)</td>
<td valign="middle" align="center">34 (17.62)</td>
<td valign="middle" align="center">15 (18.07)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Irregular shape (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.532</th>
</tr>
<tr>
<td valign="middle" align="left">Yes</td>
<td valign="middle" align="center">58 (21.01)</td>
<td valign="middle" align="center">43 (22.28)</td>
<td valign="middle" align="center">15 (18.07)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">No</td>
<td valign="middle" align="center">218 (78.99)</td>
<td valign="middle" align="center">150 (77.72)</td>
<td valign="middle" align="center">68 (81.93)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Microcalcification (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">1.000</th>
</tr>
<tr>
<td valign="middle" align="left">Yes</td>
<td valign="middle" align="center">44 (15.94)</td>
<td valign="middle" align="center">31 (16.06)</td>
<td valign="middle" align="center">13 (15.66)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">No</td>
<td valign="middle" align="center">232 (84.06)</td>
<td valign="middle" align="center">162 (83.94)</td>
<td valign="middle" align="center">70 (84.34)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Calcification (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.643</th>
</tr>
<tr>
<td valign="middle" align="left">No calcification</td>
<td valign="middle" align="center">159 (57.61)</td>
<td valign="middle" align="center">112 (58.03)</td>
<td valign="middle" align="center">47 (56.63)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Microcalcification</td>
<td valign="middle" align="center">69 (25.00)</td>
<td valign="middle" align="center">50 (25.91)</td>
<td valign="middle" align="center">19 (22.89)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Macrocalcification</td>
<td valign="middle" align="center">48 (17.39)</td>
<td valign="middle" align="center">31 (16.06)</td>
<td valign="middle" align="center">17 (20.48)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Halo (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.384</th>
</tr>
<tr>
<td valign="middle" align="left">Present</td>
<td valign="middle" align="center">32 (11.59)</td>
<td valign="middle" align="center">25 (12.95)</td>
<td valign="middle" align="center">7 (8.43)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Absent</td>
<td valign="middle" align="center">244 (88.41)</td>
<td valign="middle" align="center">168 (87.05)</td>
<td valign="middle" align="center">76 (91.57)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Orientation (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.853</th>
</tr>
<tr>
<td valign="middle" align="left">Taller-than-wide</td>
<td valign="middle" align="center">129 (46.74)</td>
<td valign="middle" align="center">89 (46.11)</td>
<td valign="middle" align="center">40 (48.19)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Wider-than-tall</td>
<td valign="middle" align="center">147 (53.26)</td>
<td valign="middle" align="center">104 (53.89)</td>
<td valign="middle" align="center">43 (51.81)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Upper region (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.733</th>
</tr>
<tr>
<td valign="middle" align="left">Yes</td>
<td valign="middle" align="center">58 (21.01)</td>
<td valign="middle" align="center">39 (20.21)</td>
<td valign="middle" align="center">19 (22.89)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">No</td>
<td valign="middle" align="center">218 (78.99)</td>
<td valign="middle" align="center">154 (79.79)</td>
<td valign="middle" align="center">64 (77.11)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Nodule Position 2(%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.835</th>
</tr>
<tr>
<td valign="middle" align="left">Upper region</td>
<td valign="middle" align="center">58 (21.01)</td>
<td valign="middle" align="center">39 (20.21)</td>
<td valign="middle" align="center">19 (22.89)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Middle region</td>
<td valign="middle" align="center">135 (48.91)</td>
<td valign="middle" align="center">93 (48.19)</td>
<td valign="middle" align="center">42 (50.60)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Lower region</td>
<td valign="middle" align="center">73 (26.45)</td>
<td valign="middle" align="center">53 (27.46)</td>
<td valign="middle" align="center">20 (24.10)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Isthmus</td>
<td valign="middle" align="center">10 (3.62)</td>
<td valign="middle" align="center">8 (4.15)</td>
<td valign="middle" align="center">2 (2.41)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">CDFI pattern (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.988</th>
</tr>
<tr>
<td valign="middle" align="left">Present</td>
<td valign="middle" align="center">65 (23.55)</td>
<td valign="middle" align="center">46 (23.83)</td>
<td valign="middle" align="center">19 (22.89)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Absent</td>
<td valign="middle" align="center">211 (76.45)</td>
<td valign="middle" align="center">147 (76.17)</td>
<td valign="middle" align="center">64 (77.11)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Echotexture (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.168</th>
</tr>
<tr>
<td valign="middle" align="left">Homogeneous</td>
<td valign="middle" align="center">98 (35.51)</td>
<td valign="middle" align="center">63 (32.64)</td>
<td valign="middle" align="center">35 (42.17)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Heterogeneous</td>
<td valign="middle" align="center">178 (64.49)</td>
<td valign="middle" align="center">130 (67.36)</td>
<td valign="middle" align="center">48 (57.83)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Posterior features (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.546</th>
</tr>
<tr>
<td valign="middle" align="left">Present</td>
<td valign="middle" align="center">65 (23.55)</td>
<td valign="middle" align="center">43 (22.28)</td>
<td valign="middle" align="center">22 (26.51)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Absent</td>
<td valign="middle" align="center">211 (76.45)</td>
<td valign="middle" align="center">150 (77.72)</td>
<td valign="middle" align="center">61 (73.49)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Shadowing Posterior features (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">1.000</th>
</tr>
<tr>
<td valign="middle" align="left">Yes</td>
<td valign="middle" align="center">75 (27.17)</td>
<td valign="middle" align="center">52 (26.94)</td>
<td valign="middle" align="center">23 (27.71)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">No</td>
<td valign="middle" align="center">201 (72.83)</td>
<td valign="middle" align="center">141 (73.06)</td>
<td valign="middle" align="center">60 (72.29)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Suspicious LN (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.269</th>
</tr>
<tr>
<td valign="middle" align="left">Yes</td>
<td valign="middle" align="center">100 (36.23)</td>
<td valign="middle" align="center">68 (35.23)</td>
<td valign="middle" align="center">32 (38.55)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">No</td>
<td valign="middle" align="center">176 (63.77)</td>
<td valign="middle" align="center">125 (64.77)</td>
<td valign="middle" align="center">50 (61.45)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">TI-RADS (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.425</th>
</tr>
<tr>
<td valign="middle" align="left">3</td>
<td valign="middle" align="center">53(19.20)</td>
<td valign="middle" align="center">39 (20.21)</td>
<td valign="middle" align="center">14(16.87)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">4a</td>
<td valign="middle" align="center">102(36.96)</td>
<td valign="middle" align="center">64(33.16)</td>
<td valign="middle" align="center">38(45.78)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">4b</td>
<td valign="middle" align="center">78(28.26)</td>
<td valign="middle" align="center">57(29.53)</td>
<td valign="middle" align="center">21(25.30)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">4c</td>
<td valign="middle" align="center">29(10.51)</td>
<td valign="middle" align="center">22(11.40)</td>
<td valign="middle" align="center">7(8.43)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">5</td>
<td valign="middle" align="center">14(5.07)</td>
<td valign="middle" align="center">11 (5.70)</td>
<td valign="middle" align="center">3 (3.61)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<th valign="middle" align="left">Solitary nodule (%)</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center"/>
<th valign="middle" align="center">0.395</th>
</tr>
<tr>
<td valign="middle" align="left">Yes</td>
<td valign="middle" align="center">112 (40.58)</td>
<td valign="middle" align="center">82 (42.49)</td>
<td valign="middle" align="center">30 (36.14)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">No</td>
<td valign="middle" align="center">164 (59.42)</td>
<td valign="middle" align="center">111 (57.51)</td>
<td valign="middle" align="center">53 (63.86)</td>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">TSH (median [IQR])</td>
<td valign="middle" align="center">1.76 [1.08;2.58]</td>
<td valign="middle" align="center">1.77 [1.03;2.58]</td>
<td valign="middle" align="center">1.74 [1.11;2.55]</td>
<td valign="middle" align="center">0.745</td>
</tr>
<tr>
<td valign="middle" align="left">FT4(median [IQR])</td>
<td valign="middle" align="center">13.58 [11.63;16.24]</td>
<td valign="middle" align="center">13.68 [11.70;16.60]</td>
<td valign="middle" align="center">13.40 [11.59;15.64]</td>
<td valign="middle" align="center">0.199</td>
</tr>
<tr>
<td valign="middle" align="left">FT3(median [IQR])</td>
<td valign="middle" align="center">4.49 [4.07;5.01]</td>
<td valign="middle" align="center">4.48 [4.10;5.01]</td>
<td valign="middle" align="center">4.50 [4.02;5.00]</td>
<td valign="middle" align="center">0.882</td>
</tr>
<tr>
<td valign="middle" align="left">TgAb (median [IQR])</td>
<td valign="middle" align="center">7.61 [1.15;19.88]</td>
<td valign="middle" align="center">10.80 [1.22;20.50]</td>
<td valign="middle" align="center">3.28 [1.00;18.45]</td>
<td valign="middle" align="center">0.130</td>
</tr>
<tr>
<td valign="middle" align="left">TPOAb (median [IQR])</td>
<td valign="middle" align="center">7.08 [1.00;14.98]</td>
<td valign="middle" align="center">9.00 [1.04;15.50]</td>
<td valign="middle" align="center">2.13 [1.00;12.70]</td>
<td valign="middle" align="center">0.173</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>CDFI, Color Doppler Flow Imaging; LN, Lymph Node; TI-RADS, Thyroid Imaging Reporting and Data System; TSH, Thyroid-Stimulating Hormone; FT4, Free Thyroxine; FT3, Free Triiodothyronine; TgAb, Thyroglobulin Antibody; TPOAb, Thyroid Peroxidase Antibody.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Selection of clinical characteristics</title>
<p>The predictor variables selected by the six methods are presented in <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>. Detailed parameters for all methods (SR-FS, SR-BS, SR-BE, LASSO, Boruta and RF-RFE) can be found in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S4</bold>
</xref> and <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures S3</bold>
</xref>-<xref ref-type="supplementary-material" rid="SM1">
<bold>S5</bold>
</xref>. A total of 10, 6, 6, 5, 8, and 10 predictors were identified using the six selection methods. As shown in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S4</bold>
</xref>, variables such as TSH, FT4, and Echotexture did not show a significant association with malignancy in the initial univariate screening and were therefore not carried forward into the final model building stage. <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref> illustrates the intersection of predictors selected by the six methods. Predictors with more than six intersections were selected as final predictors, including BRAF, composition, shape, orientation, and TI-RADS. Ultimately, five predictors were included in the development of the model.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Predictor variables of Bethesda III nodules using different selection methods.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Methods</th>
<th valign="middle" align="left">Predictor variables</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">SR-FS</td>
<td valign="middle" align="left">AUS, BRAF, Size, Composition, Echogenicity, Margin, Shape, Orientation, TI-RADS, TgAb</td>
</tr>
<tr>
<td valign="middle" align="left">SR-BE</td>
<td valign="middle" align="left">BRAF, Composition, Shape, Orientation, TI-RADS, TgAb</td>
</tr>
<tr>
<td valign="middle" align="left">SR-BS</td>
<td valign="middle" align="left">BRAF, Composition, Shape, Orientation, TI-RADS, TgAb</td>
</tr>
<tr>
<td valign="middle" align="left">LASSO</td>
<td valign="middle" align="left">BRAF, Composition, Shape, Orientation, TI-RADS</td>
</tr>
<tr>
<td valign="middle" align="left">Boruta</td>
<td valign="middle" align="left">BRAF, Size, Composition, Margin, Shape, Orientation, TI-RADS, TgAb</td>
</tr>
<tr>
<td valign="middle" align="left">RF-RFE</td>
<td valign="middle" align="left">BRAF, Size, Composition, Shape, Orientation, TI-RADS, TgAb, TSH, FT4, Echotexture</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>SR-FS, stepwise regression-forward selection; SR-BS, stepwise regression-backward selection; SR-BE, stepwise regression-bidirectional elimination; LASSO, least absolute shrinkage and selection operator; RF-RFE, random forest feature elimination; AUS, Atypia of Undetermined Significance; TI-RADS, Thyroid Imaging Reporting and Data System; TSH, Thyroid-Stimulating Hormone; FT4, Free Thyroxine; TgAb, Thyroglobulin Antibody.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Upset plot of interactions between the predictors. <bold>(A)</bold> BRAF, composition, shape, orientation, TI-RADS. <bold>(B)</bold> TSH, FT4, Echotexture. <bold>(C)</bold> AUS, Echogenicity. <bold>(D)</bold> Size. <bold>(E)</bold> Margin. <bold>(F)</bold> TgAb. SR-FS, stepwise regression-forward selection; SR-BS, stepwise regression-backward selection; SR-BE, stepwise regression-bidirectional elimination; LASSO, least absolute shrinkage and selection operator; RF-RFE, random forest -recursive feature elimination.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-16-1655828-g001.tif">
<alt-text content-type="machine-generated">Bar chart showing the number of intersections for predictors A to F. A has the highest with five intersections, followed by B with three, and C with two. D, E, and F each have one. A legend shows color-coded bars for RF-RFE, Boruta, LASSO, SR-BS, SR-BE, and SR-FS, indicating the number of predictors ranging from five to ten.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Performances of different models</title>
<p>In our comparative analysis, we evaluated five machine learning models against the LR model. Although complex models such as RF achieved better training set performance, the LR model exhibited the most robust and clinically meaningful results in the validation set, as evidenced by <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref> and <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>. The six models were developed using six distinct machine learning algorithms. The estimated odds ratios for the logistic regression model are presented in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S5</bold>
</xref> and visualized in a forest plot (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S6</bold>
</xref>). We further illustrate visualizations for the other models, including the relative importance of potential features and heatmaps of confusion matrices for the decision tree, random forest, extreme gradient boosting, support vector machine, and k-nearest neighbors models derived from the training cohort. However, due to the nature of the KNN model, the ranking of feature importance is not applicable in this case.</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Predictive performance metrics of different machine learning algorithms of the training set and validation set.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Model</th>
<th valign="middle" align="left">LR</th>
<th valign="middle" align="left">DT</th>
<th valign="middle" align="left">RF</th>
<th valign="middle" align="left">XGB</th>
<th valign="middle" align="left">SVM</th>
<th valign="middle" align="left">KNN</th>
</tr>
</thead>
<tbody>
<tr>
<th valign="middle" colspan="7" align="left">Training set</th>
</tr>
<tr>
<td valign="middle" align="center">AUC (95%)</td>
<td valign="middle" align="left">0.89 (0.84-0.93)</td>
<td valign="middle" align="left">0.83 (0.77-0.89)</td>
<td valign="middle" align="left">0.92 (0.89-0.96)</td>
<td valign="middle" align="left">0.90 (0.86-0.95)</td>
<td valign="middle" align="left">0.88 (0.83-0.93)</td>
<td valign="middle" align="left">0.90 (0.86-0.94)</td>
</tr>
<tr>
<td valign="middle" align="center">SEN</td>
<td valign="middle" align="left">0.92</td>
<td valign="middle" align="left">0.87</td>
<td valign="middle" align="left">0.78</td>
<td valign="middle" align="left">0.82</td>
<td valign="middle" align="left">0.73</td>
<td valign="middle" align="left">0.79</td>
</tr>
<tr>
<td valign="middle" align="center">SPE</td>
<td valign="middle" align="left">0.70</td>
<td valign="middle" align="left">0.71</td>
<td valign="middle" align="left">0.91</td>
<td valign="middle" align="left">0.85</td>
<td valign="middle" align="left">0.85</td>
<td valign="middle" align="left">0.84</td>
</tr>
<tr>
<td valign="middle" align="center">PPV</td>
<td valign="middle" align="left">0.85</td>
<td valign="middle" align="left">0.83</td>
<td valign="middle" align="left">0.94</td>
<td valign="middle" align="left">0.91</td>
<td valign="middle" align="left">0.90</td>
<td valign="middle" align="left">0.90</td>
</tr>
<tr>
<td valign="middle" align="center">NPV</td>
<td valign="middle" align="left">0.82</td>
<td valign="middle" align="left">0.76</td>
<td valign="middle" align="left">0.69</td>
<td valign="middle" align="left">0.71</td>
<td valign="middle" align="left">0.63</td>
<td valign="middle" align="left">0.68</td>
</tr>
<tr>
<td valign="middle" align="center">ACC</td>
<td valign="middle" align="left">0.85</td>
<td valign="middle" align="left">0.83</td>
<td valign="middle" align="left">0.94</td>
<td valign="middle" align="left">0.91</td>
<td valign="middle" align="left">0.90</td>
<td valign="middle" align="left">0.90</td>
</tr>
<tr>
<td valign="middle" align="center">F1 score</td>
<td valign="middle" align="left">0.89</td>
<td valign="middle" align="left">0.85</td>
<td valign="middle" align="left">0.85</td>
<td valign="middle" align="left">0.86</td>
<td valign="middle" align="left">0.81</td>
<td valign="middle" align="left">0.84</td>
</tr>
<tr>
<td valign="middle" align="center">Brier score</td>
<td valign="middle" align="left">0.13</td>
<td valign="middle" align="left">0.15</td>
<td valign="middle" align="left">0.11</td>
<td valign="middle" align="left">0.12</td>
<td valign="middle" align="left">0.13</td>
<td valign="middle" align="left">0.14</td>
</tr>
<tr>
<th valign="middle" colspan="7" align="left">Validation set</th>
</tr>
<tr>
<td valign="middle" align="center">AUC (95%)</td>
<td valign="middle" align="left">0.82 (0.73-0.92)</td>
<td valign="middle" align="left">0.76 (0.66-0.86)</td>
<td valign="middle" align="left">0.79 (0.69-0.89)</td>
<td valign="middle" align="left">0.82 (0.72-0.91)</td>
<td valign="middle" align="left">0.82 (0.73-0.91)</td>
<td valign="middle" align="left">0.77 (0.67-0.87)</td>
</tr>
<tr>
<td valign="middle" align="center">SEN</td>
<td valign="middle" align="left">0.85</td>
<td valign="middle" align="left">0.82</td>
<td valign="middle" align="left">0.70</td>
<td valign="middle" align="left">0.74</td>
<td valign="middle" align="left">0.63</td>
<td valign="middle" align="left">0.80</td>
</tr>
<tr>
<td valign="middle" align="center">SPE</td>
<td valign="middle" align="left">0.55</td>
<td valign="middle" align="left">0.61</td>
<td valign="middle" align="left">0.72</td>
<td valign="middle" align="left">0.72</td>
<td valign="middle" align="left">0.86</td>
<td valign="middle" align="left">0.59</td>
</tr>
<tr>
<td valign="middle" align="center">PPV</td>
<td valign="middle" align="left">0.78</td>
<td valign="middle" align="left">0.76</td>
<td valign="middle" align="left">0.83</td>
<td valign="middle" align="left">0.83</td>
<td valign="middle" align="left">0.90</td>
<td valign="middle" align="left">0.78</td>
</tr>
<tr>
<td valign="middle" align="center">NPV</td>
<td valign="middle" align="left">0.67</td>
<td valign="middle" align="left">0.69</td>
<td valign="middle" align="left">0.57</td>
<td valign="middle" align="left">0.60</td>
<td valign="middle" align="left">0.56</td>
<td valign="middle" align="left">0.61</td>
</tr>
<tr>
<td valign="middle" align="center">ACC</td>
<td valign="middle" align="left">0.78</td>
<td valign="middle" align="left">0.76</td>
<td valign="middle" align="left">0.83</td>
<td valign="middle" align="left">0.83</td>
<td valign="middle" align="left">0.90</td>
<td valign="middle" align="left">0.78</td>
</tr>
<tr>
<td valign="middle" align="center">F1 score</td>
<td valign="middle" align="left">0.81</td>
<td valign="middle" align="left">0.79</td>
<td valign="middle" align="left">0.76</td>
<td valign="middle" align="left">0.78</td>
<td valign="middle" align="left">0.74</td>
<td valign="middle" align="left">0.79</td>
</tr>
<tr>
<td valign="middle" align="center">Brier score</td>
<td valign="middle" align="left">0.16</td>
<td valign="middle" align="left">0.19</td>
<td valign="middle" align="left">0.21</td>
<td valign="middle" align="left">0.16</td>
<td valign="middle" align="left">0.16</td>
<td valign="middle" align="left">0.23</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>DT, decision tree; KNN, k-nearest neighbors; LR, logistic regression; RF, random forest; SVM, support vector machine; XGB, XGBoost; AUC, area under curve; SEN, sensitivity; SPE, specificity; PPV, positive predictive value; NPV, negative predictive value; ACC, accuracy.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Performance comparison of different machine learning models in the training set and validation set. <bold>(A)</bold> ROC curves in the training set. <bold>(B)</bold> ROC curves in the validation set. <bold>(C)</bold> Calibration curves in the training set. <bold>(D)</bold> Calibration curves in the validation set. <bold>(E)</bold> DCA results in the training set. <bold>(F)</bold> DCA results in the validation set. <bold>(A, B)</bold> The dotted lines in the ROC curves represent the reference line. <bold>(C, D)</bold> The dotted lines in the calibration curves represent a perfect prediction by an ideal model. <bold>(E, F)</bold> The &#x201c;treat all&#x201d; lines in the DCA results assume that all nodules were malignant, whereas the &#x201c;treat none&#x201d; lines assume that all nodules were benign lesions. Abbreviations: DT, decision tree; AUC, area under curve; KNN, k-nearest neighbors; LR, logistic regression; RF, random forest; SVM, support vector machine; XGB, XGBoost; ROC, receiver operating characteristic; DCA, Decision Curve Analysis.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-16-1655828-g002.tif">
<alt-text content-type="machine-generated">Six charts display model performance metrics for training and validation sets. A and B show ROC curves, illustrating sensitivity versus specificity for different models. C and D present calibration curves, comparing predicted versus observed probabilities. E and F depict decision curve analysis results, highlighting net benefit across thresholds for various models: DT, KNN, LR, RF, SVM, and XGB.</alt-text>
</graphic>
</fig>
<p>The RF model demonstrated the highest area under the ROC curve (AUC, 0.923; 95% CI: 0.887&#x2013;0.959) in the training set (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2A</bold>
</xref>), whereas the LR model achieved the highest AUC (0.823; 95% CI: 0.732&#x2013;0.915) in the validation set (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>). The AUC values for the remaining models in the validation set were as follows: (1) DT: 0.758, 95% CI: 0.657&#x2013;0.859; (2) RF: 0.792, 95% CI: 0.694&#x2013;0.890; (3) XGB: 0.817, 95% CI: 0.722&#x2013;0.912; (4) SVM: 0.822, 95% CI: 0.730&#x2013;0.913; (5) KNN: 0.771, 95% CI: 0.668&#x2013;0.873 (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>). Based on the DeLong test (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Tables S7</bold>
</xref>, <xref ref-type="supplementary-material" rid="SM1">
<bold>S8</bold>
</xref>), no significant difference in AUC was observed in the validation cohort. This may be due to the limited sample size or the similar performance of the models.</p>
<p>The DT model showed the best consistency between observed and predicted results in both the training and validation sets (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2C</bold>
</xref>). In contrast, the LR, SVM, KNN, and XGB models exhibited similarly good consistency between observed and predicted results in the validation set (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2D</bold>
</xref>). The consistency between observed and predicted results in the RF model was less stable in the validation set (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2D</bold>
</xref>).</p>
<p>In the training set, all models demonstrated similar DCA results (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2E</bold>
</xref>), whereas the LR, SVM, and XGB models achieved the best DCA outcomes in the validation set (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2F</bold>
</xref>). In the validation set, using alternative models resulted in a greater net benefit compared to no treatment or full treatment strategies when the threshold probability was &lt;80%.</p>
<p>The RF model exhibited the highest precision and specificity in the training set, whereas the LR model achieved the highest recall and F1 score, as well as the second lowest Brier score. In the validation set, the LR model achieved the highest recall and F1 score, whereas the SVM model demonstrated the highest precision. Detailed information can be found in <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>. Model performance in the validation set served as the primary criterion for identifying the optimal model. Although the LR model exhibited moderate specificity (0.55), its superior AUC (0.823), recall (sensitivity, 0.85), and F1 score (0.81) justified its selection as the optimal model. For malignancy risk assessment, minimizing false negatives through high recall remains clinically critical.</p>
<p>In summary, while the RF model may exhibit potential overfitting, the LR model demonstrates not only strong interpretability but also achieves the highest AUC in the validation set. Taking into account model performance, complexity, generalization capability, and practicality, the LR model was ultimately chosen. The forest plot illustrates variables with P-values greater than 0.05 (composition), and due to its clinical significance in daily medical practice, this variable was retained in the logistic regression model for interpretation of its effect size.</p>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Nomogram construction and application</title>
<p>The nomogram was constructed by incorporating five variables&#x2014;BRAF, composition, shape, orientation, and TI-RADS&#x2014;into the predictive model (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>). Following 500 bootstrap iterations, the LR model demonstrated an AUC of 0.871 (95% CI: 0.817&#x2013;0.926) in the training set and 0.846 (95% CI: 0.762&#x2013;0.930) in the validation set (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4A, B</bold>
</xref>). After 500 bootstrap iterations for calibration, the calibration curve closely aligned with the ideal diagonal. The average absolute errors (MAEs) for the two datasets were 0.013 and 0.031, respectively, indicating that the predicted probabilities closely aligned with the actual outcomes across different samples (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4C, D</bold>
</xref>). The Hosmer-Lemeshow test confirmed good consistency between the predicted and observed results (P = 0.414). DCA showed that applying the LR nomogram provided greater net benefit than no treatment or full treatment strategies when the threshold probability ranged from 16% to 96% in the training set and from 15% to 95% in the validation set (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4E, F</bold>
</xref>). Using this model, clinicians can more accurately assess the risk of malignancy in Bethesda III nodules, providing optimized management and treatment options. The integration of this predictive model significantly enhances the precision of patient management. This highlights the importance of leveraging precise, data-driven decisions in clinical practice. We further assessed the independence of the variables in the model by calculating the VIF and found that all VIF values were well below the common threshold of 5, indicating low multicollinearity and confirming the model&#x2019;s stability and reliability. The detailed VIF values are provided in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S6</bold>
</xref>. Our analysis compared the ROC curves of the nomogram with those of the five individual predictors for malignancy risk assessment. The nomogram exhibited superior diagnostic performance, as illustrated in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S14</bold>
</xref>.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>
<bold>(A)</bold> Nomogram used for predicting the risk of malignancy for Bethesda III nodules. Logistic regression algorithm was used to establish nomogram. The final score (ie, Total Points) is calculated as the sum of the individual scores of each of the ten variables included in the nomogram. <bold>(B)</bold> A web-based calculator for predicting malignancy risk in Bethesda III nodules. Abbreviations: TI-RADS, Thyroid Imaging Reporting and Data System.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-16-1655828-g003.tif">
<alt-text content-type="machine-generated">A two-part image depicting diagnostic tools for predicting medical conditions. Part A shows a nomogram used for calculating risk based on factors like BRAF mutation, solid composition, shape, orientation, and TI-RADS with a point scale from zero to three hundred. Part B displays the AUS Nomogram Predictor interface with sliders for BRAF, composition, shape, orientation, and RADS, along with a graph for visualizing probability of disease response with confidence intervals. Model predictions include a probability of 0.915 with specific upper and lower bounds.</alt-text>
</graphic>
</fig>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Performance of the logistic regression model with 500 bootstraps. <bold>(A)</bold> ROC curves in the training set. <bold>(B)</bold> ROC curves in the validation set. <bold>(C)</bold> Calibration curves in the training set. <bold>(D)</bold> Calibration curves in the validation set. <bold>(E)</bold> DCA results in the training set. <bold>(F)</bold> DCA results in the validation set. <bold>(A, B)</bold> The diagonal lines in the ROC curves represent the reference line; the &#x201c;Apparent ROC&#x201d; lines represent the apparent performance of the model, whereas the &#x201c;Bootstrap ROC&#x201d; lines represent the model&#x2019;s performance after 500 bootstraps. <bold>(C, D)</bold> The dotted lines in the calibration curves represent a perfect prediction by an ideal model; the &#x201c;Apparent&#x201d; lines denote the apparent performance of the model, whereas the &#x201c;Bias-corrected&#x201d; lines reflect the model&#x2019;s performance after 500 bootstraps; a closer fit to the dotted lines indicates a better predictive effect. <bold>(E, F)</bold> The &#x201c;treat all&#x201d; lines in the DCA results assume that all nodules were malignant, whereas the &#x201c;treat none&#x201d; lines assume that all nodules were benign lesions; the &#x201c;Nomo model&#x201d; lines represent the performance of the model. For example, if a patient&#x2019;s threshold probability is 75%, the net benefit is approximately 0.3 in the validation set, meaning that 30 out of 100 patients may benefit from using this model. ROC, receiver operating characteristic; DCA, Decision Curve Analysis.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-16-1655828-g004.tif">
<alt-text content-type="machine-generated">Six panels showing performance metrics for predictive models. Panels A and B are ROC curves comparing apparent and bootstrap ROC, showing high accuracy. Panels C and D are calibration curves displaying actual versus predicted probabilities with ideal, apparent, and bias-corrected lines. Panels E and F are decision curves illustrating net benefit across threshold probabilities for treating all, treating none, and using a nomogram model. Each graph has distinct features highlighting performance and calibration across various thresholds and probabilities.</alt-text>
</graphic>
</fig>
<p>Compared to the complex logistic regression formula, the nomogram is simpler, more intuitive, and clinically practical. To use the nomogram, a line is drawn from the value of each feature to the &#x201c;points&#x201d; axis, obtaining the corresponding score. After summing these points, the total score is located on the &#x201c;total points&#x201d; axis. Finally, a line is drawn downward from the total score to the &#x201c;probability of malignancy&#x201d; axis to determine the corresponding risk. For example, when a patient is BRAF-positive with an ultrasound indicating a solid nodule, a regular shape, a vertical-to-horizontal ratio &lt;1, and a TI-RADS score of 4a, their &#x201c;BRAF&#x201d; score is 91, &#x201c;composition&#x201d; is 32, &#x201c;shape&#x201d; is 0, &#x201c;orientation&#x201d; is 0, and &#x201c;TI-RADS&#x201d; is 24. The total score is 147, corresponding to a malignancy probability of 0.72 (72%). Therefore, the surgeon may consider this patient at high risk for Bethesda III nodules malignancy and recommend diagnostic lobectomy (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3A</bold>
</xref>).</p>
<p>To support clinical implementation of this predictive model, we developed a web-based calculator that enables physicians to input patient-specific clinical data and immediately obtain malignancy risk estimates for Bethesda III nodules, thereby supporting more informed clinical decisions. The tool streamlines risk assessment while facilitating personalized patient management through individualized risk stratification. The calculator is publicly accessible online at <ext-link ext-link-type="uri" xlink:href="https://13583155338-l.shinyapps.io/PredictionofAUS/">https://13583155338-l.shinyapps.io/PredictionofAUS/</ext-link> (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>).</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>According to the 2023 TBSRTC, the estimated malignant risk for Bethesda III nodules ranges from 10% to 30%, but recent studies report a significantly higher malignancy rate than predicted (<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B33">33</xref>). More importantly, after being informed of the 10-30% malignancy risk and receiving follow-up treatment recommendations for US-FNA, these cases show higher rates of inconclusive results (up to 60%) on repeat FNA (<xref ref-type="bibr" rid="B34">34</xref>, <xref ref-type="bibr" rid="B35">35</xref>). Although several studies have addressed this challenge, most focus on specific factors, with few providing comprehensive clinical, ultrasound, genetic, and pathological data. Additionally, many studies are limited by small sample sizes due to the absence of comprehensive postoperative pathological data, hindering their ability to conduct balanced research or only allowing for one-sided conclusions. Ahn, H. S. et&#xa0;al. (<xref ref-type="bibr" rid="B23">23</xref>) included surgical and repeat biopsy results to analyze nodule characteristics. By combining ultrasound features, nodule size, and cytological subtypes, they provided more accurate malignancy risk stratification for Bethesda III nodules. Ahmadi, S. et&#xa0;al. (<xref ref-type="bibr" rid="B36">36</xref>) observed 141 Bethesda III nodules with multigene testing and 12 months of ultrasound follow-up. The study showed a 100% negative predictive value, demonstrating the feasibility of follow-up using multigene testing for these nodules. Numerous studies have shown that multigene testing achieves a negative predictive value close to 100% in follow-up observation of Bethesda III nodules, proving its feasibility (<xref ref-type="bibr" rid="B37">37</xref>, <xref ref-type="bibr" rid="B38">38</xref>). Therefore, we innovatively included Bethesda III nodules with surgical pathology, repeat biopsy, and multigene testing. We then compared logistic regression and five ML models to predict and analyze the malignancy risk of Bethesda III nodules, ultimately selecting logistic regression as the ideal model for developing predictive models and nomograms.</p>
<p>Due to the lack of standardized guidelines or consensus for feature selection in predictive models, it remains unclear how many features should be included in the model. Relevant risk variables often exhibit correlations, and multicollinearity can cause issues such as overfitting and computational complexity. To address this, we applied six feature selection methods to the study population, aiming to reduce the high correlation between predictors and capture the complex relationships with outcome variables.</p>
<p>We selected BRAF, composition, shape, orientation, and TI-RADS, with BRAF identified as the most significant predictor. The standalone BRAF V600E test has become a relatively cost-effective and routine preoperative tool in many tertiary hospitals across China. In this study, the odds ratio (OR) for BRAF was 17, and the BRAF V600E mutation rate in patients diagnosed with Bethesda III nodules and ultimately confirmed to have PTC reached 87.93% (<xref ref-type="bibr" rid="B39">39</xref>). However, BRAF for malignancy detection in the Bethesda III nodules population has a sensitivity of only 30%-40%. Research by Paspala, A. et&#xa0;al. (<xref ref-type="bibr" rid="B40">40</xref>) found that the detection rate of BRAF mutations in Bethesda III is lower than in Bethesda V/VI, suggesting its greater utility for stratification in high-risk subgroups but also its limitations in Bethesda III nodules. When BRAF is negative, gene testing cannot predict whether Bethesda III nodules are benign or malignant, with a negative predictive value of 38.1%-52.6% (<xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B41">41</xref>). Therefore, malignancy prediction in Bethesda III nodules requires a combined approach that integrates ultrasound characteristics for improved diagnostic accuracy (<xref ref-type="bibr" rid="B42">42</xref>, <xref ref-type="bibr" rid="B43">43</xref>). Composition, shape, and orientation are independent imaging risk factors for thyroid nodules and should be incorporated into predictive models for Bethesda III nodules malignancy. Jin, L. et&#xa0;al. (<xref ref-type="bibr" rid="B44">44</xref>) demonstrated that spatial heterogeneity in malignant nodules, quantified by ultrasound contrast enhancement, was significantly higher. Ultrasound findings of nodules with blurred margins, lobulated, or irregular contours suggest a higher likelihood of malignancy in Bethesda III nodules (<xref ref-type="bibr" rid="B45">45</xref>, <xref ref-type="bibr" rid="B46">46</xref>). Thyroid nodule taller-than-wide (TTW) feature is a strong predictor of malignancy. Studies have shown that a shape with TTW yields a diagnostic accuracy of up to 83%, with a specificity of 73% (<xref ref-type="bibr" rid="B47">47</xref>). Additionally, combining composition, shape, orientation, and other ultrasound features significantly enhances both sensitivity and specificity in diagnosis (<xref ref-type="bibr" rid="B43">43</xref>, <xref ref-type="bibr" rid="B48">48</xref>).</p>
<p>This study also included a subgroup analysis of Bethesda III nodules and examined the correlation between thyroid function and the benign or malignant nature of Bethesda III nodules. The findings show that the atypical nuclear category significantly differs from other categories in multiple aspects. First, the risk of malignancy (ROM) in cases with atypical nuclei is significantly higher than in cases with architectural atypia. Categorizing Bethesda III cases into nuclear atypia and architectural atypia subgroups may improve ROM stratification (<xref ref-type="bibr" rid="B49">49</xref>). Second, the proportion of malignant tumors in Bethesda III nodules increases with higher TI-RADS classifications, though no such difference is observed in FLUS (<xref ref-type="bibr" rid="B45">45</xref>). Moreover, both nuclear and architectural atypia subcategories in AUS exhibit high ROM, classifying them into high-risk groups (<xref ref-type="bibr" rid="B50">50</xref>, <xref ref-type="bibr" rid="B51">51</xref>). Therefore, this study categorized pathological features into nuclear and architectural atypia. Unfortunately, neither cytological atypia subtype showed statistical significance in predicting malignancy in our analysis. This result is likely attributable to the limited sample size in the subgroups, particularly for nuclear atypia, which resulted in insufficient statistical power to detect a potential difference. The 2023 TBSRTC revision has streamlined subcategorization into two classifications: AUS-nuclear and AUS-other. This modification indirectly demonstrates the limitations of relying solely on traditional cytological subtypes for predicting malignancy risk, as subcategorization alone cannot provide sufficient clinical decision-making support. Future studies will seek to increase the sample size to investigate the relationship between pathological subtypes and the malignancy rate of Bethesda III nodules. The study found significant differences in TgAb levels between benign and malignant nodules, suggesting its potential role in preoperative malignancy diagnosis. Retrospective studies in Chinese patients showed that the TgAb positivity rate was significantly higher in PTC patients than in those with benign thyroid nodules, suggesting a potential link to malignant tumor occurrence (<xref ref-type="bibr" rid="B52">52</xref>).</p>
<p>In the era of big data, machine learning models for predicting clinical events have become increasingly important. Clinical EMR data is relatively objective, accurate, and easily accessible for clinicians and researchers. Combining EMR data with complex machine learning algorithms facilitates the development of clinical prediction models (<xref ref-type="bibr" rid="B53">53</xref>). This study demonstrates the capabilities of various machine learning models in predicting the benign or malignant nature of Bethesda III nodules and aims to identify the most suitable algorithm based on the dataset&#x2019;s characteristics and the study&#x2019;s objectives. Different machine learning algorithms have distinct principles, strengths, and applicable scenarios, but also limitations and biases. LR are traditional classification algorithms suited for linear relationships but sensitive to outliers. Decision trees, based on tree structures, are prone to overfitting and noise sensitivity. Random forests, using simple averaging or voting strategies, require significant computational resources and have poor interpretability. SVM optimize objective functions to find the optimal hyperplane but incur high computational costs and require careful parameter tuning. XGB, employing gradient boosting, requires long training times and extensive hyperparameter tuning. KNN are computationally intensive and struggle with high-dimensional data (<xref ref-type="bibr" rid="B54">54</xref>&#x2013;<xref ref-type="bibr" rid="B56">56</xref>). In this study, the LR model achieved an AUC of 0.823 in the validation set, with superior sensitivity, recall, and F1 scores compared to more complex models, demonstrating its practical significance. When the primary goal is to analyze the relationship between outcomes and risk factors, especially with small datasets, traditional methods like logistic regression may be sufficient (<xref ref-type="bibr" rid="B57">57</xref>). This finding supports the argument that machine learning does not always outperform LR in predictive modelling (<xref ref-type="bibr" rid="B58">58</xref>). Additionally, the generalizability of the models, assessed through five-fold cross-validation, indicates that they can handle unseen data and reliably perform risk assessments in new clinical contexts. This comprehensive approach improved the predictive accuracy of the models and enhanced their reliability in practical applications.</p>
<p>The LR model outperformed others in discriminative ability, calibration, and clinical net benefit. The newly developed LR model, which integrates easily accessible pathological, ultrasound, and clinical features, performed well, with an AUC of 0.823 in the validation set. Besides AUC, we evaluated the LR model&#x2019;s performance using other metrics, including precision, recall, F1 score, and Brier score. Due to its simple structure, the LR model excelled, demonstrating outstanding interpretability and high performance across these key metrics. The LR model&#x2019;s higher F1 score reflects a reasonable balance between precision and recall, minimizing both false positives and false negatives, which is critical for clinical decision-making. The calibration plot showed good agreement between predicted and actual values. More importantly, decision curve analysis revealed that the LR model provides substantial clinical net benefit, supporting clinical decision-making. In terms of applicability, the LR model is characterized by its simple structure and high interpretability. However, the differences in predictive performance across models were not significant, likely due to the limited sample size of the validation set. Considering its interpretability, calibration, clinical utility, and potential for further analysis, the LR model remains the optimal choice. Additionally, incorporating AUS subtypes and thyroid function tests into the model may improve its predictive performance. The model&#x2019;s low specificity inevitably increases false-positive rates in clinical settings. While these false positives may prompt additional diagnostic procedures, they rarely result in immediate radical interventions. Decision curve analysis confirms that despite this limitation, the model prevents more unnecessary procedures than it generates when benchmarked against universal treatment strategies. In addition, we recommend that future studies incorporate additional pathological and biochemical clinical data to potentially improve predictive outcomes.</p>
<p>This study developed a nomogram, which was evaluated through 500 bootstrap iterations and assessed for predictive performance using several goodness-of-fit tests, including the Hosmer&#x2013;Lemeshow test, AUC-ROC, calibration curve, and DCA. The Hosmer&#x2013;Lemeshow test showed good agreement between predicted and observed values (P = 0.414). The observed AUC difference (&#x394; = 0.025) between the training and validation cohorts indicates that the sample size is adequate to assess the model&#x2019;s general applicability and effectiveness. The calibration curve also showed strong consistency between predicted and actual outcomes, underscoring the model&#x2019;s reliability. Furthermore, the DCA results demonstrated that across a wide range of probability thresholds, the nomogram consistently offered greater clinical benefit than universal treatment or no treatment. Previous studies have also developed nomograms to predict the benign or malignant nature of Bethesda III nodules using systematic risk factors. Yoon, J. H. et&#xa0;al. (<xref ref-type="bibr" rid="B15">15</xref>) reported a nomogram with an AUC of 0.754 but did not evaluate its applicability using DCA. &#xd6;cal, B. et&#xa0;al. (<xref ref-type="bibr" rid="B59">59</xref>) reported an AUC of 0.784 in the validation set, although their dataset included uncertain nodules from Bethesda III, IV, and V categories. Zhong, L. et&#xa0;al. (<xref ref-type="bibr" rid="B16">16</xref>) described a nomogram with an AUC of 0.823, but its applicability was more limited, with a threshold probability range of 21% to 70%. Cao, Y. et&#xa0;al.0 (<xref ref-type="bibr" rid="B14">14</xref>) reported a nomogram with an AUC of 0.80, comparing two machine learning methods to traditional logistic regression. The nomogram developed in this study has an AUC higher than those reported in the aforementioned studies and shows broader applicability in DCA. Moreover, these previous studies employed only logistic regression or a few machine learning algorithms, without comparing them to a broader range of machine learning models. As a result, this study is more innovative and comprehensive. By using this nomogram, clinicians can accurately predict the benign or malignant nature of Bethesda III nodules, thus guiding clinical decision-making.</p>
<p>This study has several limitations. First, although robust internal validation through cross-validation and bootstrap methods strengthened the methodological rigor, the lack of external validation with an independent cohort remains a significant limitation. The single-center, retrospective nature of our dataset may introduce selection bias, and the small sample size could lead to overfitting in machine learning models, limiting the model&#x2019;s generalizability across clinical practices with varying demographic characteristics, institutions, and regions. To address this limitation, future research should prioritize multicenter collaborations to validate and optimize the model in diverse settings, ensuring broader clinical applicability. Second, while our case selection included Bethesda III nodules patients followed up in outpatient settings without surgery, we did not conduct prospective follow-up for all patients. We used BRAF mutation analysis as part of routine preoperative testing, but did not include the 12-gene panel in the routine screening, which may have caused discrepancies in molecular analysis results. Patients who underwent surgery, repeat FNA, or molecular testing likely represent a higher-risk subset compared to those managed conservatively. Although the 12-gene test and repeat biopsy have nearly 100% negative predictive value, biases may still arise due to the relatively short follow-up period. Furthermore, we acknowledge that the minimum six-month follow-up period for non-surgical cases may be insufficient to capture all slow-growing malignancies. Future studies should prioritize long-term follow-up and include these additional mutations to enhance the comprehensiveness and accuracy of the predictive model. Third, our study cohort presented a malignancy rate of 65.2%, which is substantially higher than the 13-30% rate typically estimated for Bethesda III nodules. Consequently, our model was trained on a higher-risk population than is typically encountered in general clinical practice. Fourth, our study did not employ an exhaustive hyperparameter tuning process, such as grid search or random search, for the more complex machine learning models like Random Forest and XGBoost. Lastly, inter-observer variability in the interpretation of US and FNAB results may occur. In conclusion, of the six machine learning algorithms evaluated, LR demonstrated the best performance in this study.</p>
<p>Consequently, a logistic regression-based nomogram was developed to predict the benign or malignant nature of Bethesda III nodules. Future studies should focus on further prospective external validation to assess whether follow-up strategies based on the final predictive model can effectively predict the benign or malignant nature of Bethesda III nodules.</p>
</sec>
</body>
<back>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="s6" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving humans were approved by the 960th Hospital of the PLA Joint Logistics Support Force Research Ethics Committee. The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>WL: Data curation, Formal analysis, Writing &#x2013; original draft. JZ: Data curation, Formal analysis, Writing &#x2013; review &amp; editing. YW: Supervision, Validation, Writing &#x2013; original draft. JL: Visualization, Resources, Software, Supervision, Writing &#x2013; review &amp; editing. ZL: Resources, Software, Visualization, Writing &#x2013; review &amp; editing. CW: Data curation, Resources, Software, Writing &#x2013; review &amp; editing. JX: Resources, Software, Writing &#x2013; review &amp; editing. PZ: Funding acquisition, Supervision, Validation, Visualization, Writing &#x2013; review &amp; editing. QH: Funding acquisition, Resources, Software, Supervision, Validation, Writing &#x2013; review &amp; editing.</p>
</sec>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research and/or publication of this article. This work was supported by the Key Medical Discipline Project of Joint Logistics Support Force of the People&#x2019;s Liberation Army of China, Key Discipline Project of Shandong Province Medical and Health and Shandong Second Medical University Affiliated Hospital (Teaching Hospital) Scientific Research Development Fund Project(2024FYM107).</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>This study was generously supported by Jingding Medical Tech, to whom we extend our sincere gratitude. We especially thank them for providing authorization and technical support for the JD_DCPM software. The team at Jingding Medical Tech offered invaluable assistance in data processing.</p>
</ack>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s12" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fendo.2025.1655828/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fendo.2025.1655828/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="SupplementaryFile1.pdf" id="SM1" mimetype="application/pdf"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Durante</surname> <given-names>C</given-names>
</name>
<name>
<surname>Grani</surname> <given-names>G</given-names>
</name>
<name>
<surname>Lamartina</surname> <given-names>L</given-names>
</name>
<name>
<surname>Filetti</surname> <given-names>S</given-names>
</name>
<name>
<surname>Mandel</surname> <given-names>SJ</given-names>
</name>
<name>
<surname>Cooper</surname> <given-names>DS</given-names>
</name>
</person-group>. <article-title>The diagnosis and management of thyroid nodules: A review</article-title>. <source>JAMA</source>. (<year>2018</year>) <volume>319</volume>:<page-range>914&#x2013;24</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1001/jama.2018.0898</pub-id>, PMID: <pub-id pub-id-type="pmid">29509871</pub-id></citation></ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grani</surname> <given-names>G</given-names>
</name>
<name>
<surname>Sponziello</surname> <given-names>M</given-names>
</name>
<name>
<surname>Filetti</surname> <given-names>S</given-names>
</name>
<name>
<surname>Durante</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>Thyroid nodules: Diagnosis and management</article-title>. <source>Nat Rev Endocrinol</source>. (<year>2024</year>) <volume>20</volume>:<page-range>715&#x2013;28</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41574-024-01025-4</pub-id>, PMID: <pub-id pub-id-type="pmid">39152228</pub-id></citation></ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ali</surname> <given-names>SZ</given-names>
</name>
<name>
<surname>Baloch</surname> <given-names>ZW</given-names>
</name>
<name>
<surname>Cochand-Priollet</surname> <given-names>B</given-names>
</name>
<name>
<surname>Schmitt</surname> <given-names>FC</given-names>
</name>
<name>
<surname>Vielh</surname> <given-names>P</given-names>
</name>
<name>
<surname>VanderLaan</surname> <given-names>PA</given-names>
</name>
</person-group>. <article-title>The 2023 Bethesda system for reporting thyroid cytopathology</article-title>. <source>Thyroid</source>. (<year>2023</year>) <volume>33</volume>:<page-range>1039&#x2013;44</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1089/thy.2023.0141</pub-id>, PMID: <pub-id pub-id-type="pmid">37427847</pub-id></citation></ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hassan</surname> <given-names>I</given-names>
</name>
<name>
<surname>Hassan</surname> <given-names>L</given-names>
</name>
<name>
<surname>Balalaa</surname> <given-names>N</given-names>
</name>
<name>
<surname>Askar</surname> <given-names>M</given-names>
</name>
<name>
<surname>Alshehhi</surname> <given-names>H</given-names>
</name>
<name>
<surname>Almarzooqi</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>The incidence of thyroid cancer in Bethesda III thyroid nodules: A retrospective analysis at a single endocrine surgery center</article-title>. <source>Diagnostics (Basel)</source>. (<year>2024</year>) <volume>14</volume>, <fpage>1026</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/diagnostics14101026</pub-id>, PMID: <pub-id pub-id-type="pmid">38786324</pub-id></citation></ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pasha</surname> <given-names>HA</given-names>
</name>
<name>
<surname>Dhanani</surname> <given-names>R</given-names>
</name>
<name>
<surname>Mughal</surname> <given-names>A</given-names>
</name>
<name>
<surname>Ahmed</surname> <given-names>KS</given-names>
</name>
<name>
<surname>Suhail</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Malignancy rate in thyroid nodules with atypia or follicular lesion of undetermined significance</article-title>. <source>Int Arch Otorhinolaryngol</source>. (<year>2020</year>) <volume>24</volume>:<page-range>e221&#x2013;26</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1055/s-0039-1698784</pub-id>, PMID: <pub-id pub-id-type="pmid">32256845</pub-id></citation></ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiragawasan</surname> <given-names>C</given-names>
</name>
<name>
<surname>Himakhun</surname> <given-names>W</given-names>
</name>
</person-group>. <article-title>The risk of Malignancy in the atypia of undetermined significance/follicular lesion of undetermined significance (AUS/FLUS) category subgroups: A Thai institute experience</article-title>. <source>J Am Soc Cytopathol</source>. (<year>2024</year>) <volume>13</volume>:<fpage>16</fpage>&#x2013;<lpage>22</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jasc.2023.09.006</pub-id>, PMID: <pub-id pub-id-type="pmid">37903698</pub-id></citation></ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yoo</surname> <given-names>WS</given-names>
</name>
<name>
<surname>Ahn</surname> <given-names>HY</given-names>
</name>
<name>
<surname>Ahn</surname> <given-names>HS</given-names>
</name>
<name>
<surname>Chung</surname> <given-names>YJ</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>HS</given-names>
</name>
<name>
<surname>Cho</surname> <given-names>BY</given-names>
</name>
<etal/>
</person-group>. <article-title>Malignancy rate of Bethesda category III thyroid nodules according to ultrasound risk stratification system and cytological subtype</article-title>. <source>Med (Baltimore)</source>. (<year>2020</year>) <volume>99</volume>:<elocation-id>e18780</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/md.0000000000018780</pub-id>, PMID: <pub-id pub-id-type="pmid">31914102</pub-id></citation></ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Raghunathan</surname> <given-names>R</given-names>
</name>
<name>
<surname>Longstaff</surname> <given-names>XR</given-names>
</name>
<name>
<surname>Hughes</surname> <given-names>EG</given-names>
</name>
<name>
<surname>Li</surname> <given-names>SJ</given-names>
</name>
<name>
<surname>Sant</surname> <given-names>VR</given-names>
</name>
<name>
<surname>Tseng</surname> <given-names>CH</given-names>
</name>
<etal/>
</person-group>. <article-title>Diagnostic performance of molecular testing in indeterminate (Bethesda III and IV) thyroid nodules with H&#xfc;rthle cell cytology</article-title>. <source>Surgery</source>. (<year>2024</year>) <volume>175</volume>:<page-range>221&#x2013;27</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.surg.2023.05.046</pub-id>, PMID: <pub-id pub-id-type="pmid">37926582</pub-id></citation></ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Geng</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Tai</surname> <given-names>J</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Correlation between BRAF (V600E) mutation and clinicopathological features in pediatric papillary thyroid carcinoma</article-title>. <source>Sci China Life Sci</source>. (<year>2017</year>) <volume>60</volume>:<page-range>729&#x2013;38</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11427-017-9083-8</pub-id>, PMID: <pub-id pub-id-type="pmid">28646474</pub-id></citation></ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fakhruddin</surname> <given-names>N</given-names>
</name>
<name>
<surname>Jabbour</surname> <given-names>M</given-names>
</name>
<name>
<surname>Novy</surname> <given-names>M</given-names>
</name>
<name>
<surname>Tamim</surname> <given-names>H</given-names>
</name>
<name>
<surname>Bahmad</surname> <given-names>H</given-names>
</name>
<name>
<surname>Farhat</surname> <given-names>F</given-names>
</name>
<etal/>
</person-group>. <article-title>BRAF and NRAS mutations in papillary thyroid carcinoma and concordance in BRAF mutations between primary and corresponding lymph node metastases</article-title>. <source>Sci Rep</source>. (<year>2017</year>) <volume>7</volume>:<fpage>4666</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-017-04948-3</pub-id>, PMID: <pub-id pub-id-type="pmid">28680105</pub-id></citation></ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sapio</surname> <given-names>MR</given-names>
</name>
<name>
<surname>Posca</surname> <given-names>D</given-names>
</name>
<name>
<surname>Troncone</surname> <given-names>G</given-names>
</name>
<name>
<surname>Pettinato</surname> <given-names>G</given-names>
</name>
<name>
<surname>Palombini</surname> <given-names>L</given-names>
</name>
<name>
<surname>Rossi</surname> <given-names>G</given-names>
</name>
<etal/>
</person-group>. <article-title>Detection of BRAF mutation in thyroid papillary carcinomas by mutant allele-specific PCR amplification (MASA)</article-title>. <source>Eur J Endocrinol</source>. (<year>2006</year>) <volume>154</volume>:<page-range>341&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1530/eje.1.02072</pub-id>, PMID: <pub-id pub-id-type="pmid">16452550</pub-id></citation></ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nikiforov</surname> <given-names>YE</given-names>
</name>
<name>
<surname>Ohori</surname> <given-names>NP</given-names>
</name>
<name>
<surname>Hodak</surname> <given-names>SP</given-names>
</name>
<name>
<surname>Carty</surname> <given-names>SE</given-names>
</name>
<name>
<surname>LeBeau</surname> <given-names>SO</given-names>
</name>
<name>
<surname>Ferris</surname> <given-names>RL</given-names>
</name>
<etal/>
</person-group>. <article-title>Impact of mutational testing on the diagnosis and management of patients with cytologically indeterminate thyroid nodules: A prospective analysis of 1056 FNA samples</article-title>. <source>J Clin Endocrinol Metab</source>. (<year>2011</year>) <volume>96</volume>:<page-range>3390&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1210/jc.2011-1469</pub-id>, PMID: <pub-id pub-id-type="pmid">21880806</pub-id></citation></ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Patel</surname> <given-names>KN</given-names>
</name>
<name>
<surname>Angell</surname> <given-names>TE</given-names>
</name>
<name>
<surname>Babiarz</surname> <given-names>J</given-names>
</name>
<name>
<surname>Barth</surname> <given-names>NM</given-names>
</name>
<name>
<surname>Blevins</surname> <given-names>T</given-names>
</name>
<name>
<surname>Duh</surname> <given-names>QY</given-names>
</name>
<etal/>
</person-group>. <article-title>Performance of a genomic sequencing classifier for the preoperative diagnosis of cytologically indeterminate thyroid nodules</article-title>. <source>JAMA Surg</source>. (<year>2018</year>) <volume>153</volume>:<page-range>817&#x2013;24</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1001/jamasurg.2018.1153</pub-id>, PMID: <pub-id pub-id-type="pmid">29799911</pub-id></citation></ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cao</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Luan</surname> <given-names>M</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>L</given-names>
</name>
<etal/>
</person-group>. <article-title>Optimizing thyroid AUS nodules Malignancy prediction: A comprehensive study of logistic regression and machine learning models</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2024</year>) <volume>15</volume>:<elocation-id>1366687</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fendo.2024.1366687</pub-id>, PMID: <pub-id pub-id-type="pmid">39568807</pub-id></citation></ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yoon</surname> <given-names>JH</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>HS</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>EK</given-names>
</name>
<name>
<surname>Moon</surname> <given-names>HJ</given-names>
</name>
<name>
<surname>Kwak</surname> <given-names>JY</given-names>
</name>
</person-group>. <article-title>A nomogram for predicting Malignancy in thyroid nodules diagnosed as atypia of undetermined significance/follicular lesions of undetermined significance on fine needle aspiration</article-title>. <source>Surgery</source>. (<year>2014</year>) <volume>155</volume>:<page-range>1006&#x2013;13</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.surg.2013.12.035</pub-id>, PMID: <pub-id pub-id-type="pmid">24630147</pub-id></citation></ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhong</surname> <given-names>L</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>L</given-names>
</name>
<name>
<surname>Lai</surname> <given-names>J</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Gu</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Combined model integrating clinical, radiomics, BRAF(V600E) and ultrasound for differentiating between benign and Malignant indeterminate cytology (Bethesda III) thyroid nodules: A bi-center retrospective study</article-title>. <source>Gland Surg</source>. (<year>2024</year>) <volume>13</volume>:<page-range>1954&#x2013;64</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.21037/gs-24-310</pub-id>, PMID: <pub-id pub-id-type="pmid">39678423</pub-id></citation></ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Rao</surname> <given-names>K</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>J</given-names>
</name>
<name>
<surname>Han</surname> <given-names>C</given-names>
</name>
<name>
<surname>Gong</surname> <given-names>L</given-names>
</name>
<name>
<surname>Chong</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Machine learning algorithms for the prediction of central lymph node metastasis in patients with papillary thyroid cancer</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2020</year>) <volume>11</volume>:<elocation-id>577537</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fendo.2020.577537</pub-id>, PMID: <pub-id pub-id-type="pmid">33193092</pub-id></citation></ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yao</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Lei</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>K</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>AI-generated content enhanced computer-aided diagnosis model for thyroid nodules: A chatGPT-style assistant</article-title>. <source>arXiv preprint arXiv</source>. (<year>2024</year>) <volume>2402</volume>:<elocation-id>2401</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.48550/arXiv.2402.02401</pub-id>
</citation></ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yao</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Lei</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>K</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>N</given-names>
</name>
<name>
<surname>Dong</surname> <given-names>F</given-names>
</name>
<etal/>
</person-group>. <article-title>Multimodal GPT model for assisting thyroid nodule diagnosis and management</article-title>. <source>NPJ Digit Med</source>. (<year>2025</year>) <volume>8</volume>:<fpage>245</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41746-025-01652-9</pub-id>, PMID: <pub-id pub-id-type="pmid">40319170</pub-id></citation></ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yao</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>J</given-names>
</name>
<name>
<surname>Lei</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Xiong</surname> <given-names>J</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>B</given-names>
</name>
<etal/>
</person-group>. <article-title>AI diagnosis of Bethesda category IV thyroid nodules</article-title>. <source>iScience</source>. (<year>2023</year>) <volume>26</volume>:<page-range>108&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.isci.2023.108114</pub-id>, PMID: <pub-id pub-id-type="pmid">37867955</pub-id></citation></ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gupta</surname> <given-names>A</given-names>
</name>
<name>
<surname>Bajaj</surname> <given-names>S</given-names>
</name>
<name>
<surname>Nema</surname> <given-names>P</given-names>
</name>
<name>
<surname>Purohit</surname> <given-names>A</given-names>
</name>
<name>
<surname>Kashaw</surname> <given-names>V</given-names>
</name>
<name>
<surname>Soni</surname> <given-names>V</given-names>
</name>
<etal/>
</person-group>. <article-title>Potential of AI and ML in oncology research including diagnosis, treatment and future directions: A comprehensive prospective</article-title>. <source>Comput Biol Med</source>. (<year>2025</year>) <volume>189</volume>:<elocation-id>109918</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compbiomed.2025.109918</pub-id>, PMID: <pub-id pub-id-type="pmid">40037170</pub-id></citation></ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Collins</surname> <given-names>GS</given-names>
</name>
<name>
<surname>Moons</surname> <given-names>KGM</given-names>
</name>
<name>
<surname>Dhiman</surname> <given-names>P</given-names>
</name>
<name>
<surname>Riley</surname> <given-names>RD</given-names>
</name>
<name>
<surname>Beam</surname> <given-names>AL</given-names>
</name>
<name>
<surname>Van Calster</surname> <given-names>B</given-names>
</name>
<etal/>
</person-group>. <article-title>TRIPOD+AI statement: Updated guidance for reporting clinical prediction models that use regression or machine learning methods</article-title>. <source>BMJ</source>. (<year>2024</year>) <volume>385</volume>:<elocation-id>e078378</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj-2023-078378</pub-id>, PMID: <pub-id pub-id-type="pmid">38626948</pub-id></citation></ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ahn</surname> <given-names>HS</given-names>
</name>
<name>
<surname>Na</surname> <given-names>DG</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>JH</given-names>
</name>
</person-group>. <article-title>Risk stratification of thyroid nodules diagnosed as Bethesda category III by ultrasound, size, and cytology</article-title>. <source>Korean J Radiol</source>. (<year>2024</year>) <volume>25</volume>:<page-range>924&#x2013;33</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3348/kjr.2024.0292</pub-id>, PMID: <pub-id pub-id-type="pmid">39344549</pub-id></citation></ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname> <given-names>J</given-names>
</name>
<name>
<surname>Yin</surname> <given-names>L</given-names>
</name>
<name>
<surname>Wei</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>S</given-names>
</name>
<name>
<surname>Song</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>B</given-names>
</name>
<etal/>
</person-group>. <article-title>2020 Chinese guidelines for ultrasound Malignancy risk stratification of thyroid nodules: The C-TIRADS</article-title>. <source>Endocrine</source>. (<year>2020</year>) <volume>70</volume>:<page-range>256&#x2013;79</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12020-020-02441-y</pub-id>, PMID: <pub-id pub-id-type="pmid">32827126</pub-id></citation></ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vittinghoff</surname> <given-names>E</given-names>
</name>
<name>
<surname>McCulloch</surname> <given-names>CE</given-names>
</name>
</person-group>. <article-title>Relaxing the rule of ten events per variable in logistic and Cox regression</article-title>. <source>Am J Epidemiol</source>. (<year>2007</year>) <volume>165</volume>:<page-range>710&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/aje/kwk052</pub-id>, PMID: <pub-id pub-id-type="pmid">17182981</pub-id></citation></ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>van Smeden</surname> <given-names>M</given-names>
</name>
<name>
<surname>Moons</surname> <given-names>KGM</given-names>
</name>
<name>
<surname>de Groot</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Collins</surname> <given-names>GS</given-names>
</name>
<name>
<surname>Altman</surname> <given-names>DG</given-names>
</name>
<name>
<surname>Eijkemans</surname> <given-names>MJ</given-names>
</name>
<etal/>
</person-group>. <article-title>Sample size for binary logistic prediction models: Beyond events per variable criteria</article-title>. <source>Stat Methods Med Res</source>. (<year>2019</year>) <volume>28</volume>:<page-range>2455&#x2013;74</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/0962280218784726</pub-id>, PMID: <pub-id pub-id-type="pmid">29966490</pub-id></citation></ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yuan</surname> <given-names>X</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Du</surname> <given-names>F</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>X</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Development and validation of a model to predict cognitive impairment in traumatic brain injury patients: A prospective observational study</article-title>. <source>EClinicalMedicine</source>. (<year>2025</year>) <volume>80</volume>:<elocation-id>103023</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.eclinm.2024.103023</pub-id>, PMID: <pub-id pub-id-type="pmid">39850016</pub-id></citation></ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Riley</surname> <given-names>RD</given-names>
</name>
<name>
<surname>Ensor</surname> <given-names>J</given-names>
</name>
<name>
<surname>Snell</surname> <given-names>KIE</given-names>
</name>
<name>
<surname>Harrell</surname> <given-names>FE</given-names>
<suffix>Jr</suffix>
</name>
<name>
<surname>Martin</surname> <given-names>GP</given-names>
</name>
<name>
<surname>Reitsma</surname> <given-names>JB</given-names>
</name>
<etal/>
</person-group>. <article-title>Calculating the sample size required for developing a clinical prediction model</article-title>. <source>BMJ</source>. (<year>2020</year>) <volume>368</volume>:<elocation-id>m441</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj.m441</pub-id>, PMID: <pub-id pub-id-type="pmid">32188600</pub-id></citation></ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dong</surname> <given-names>J</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Li</surname> <given-names>C</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z</given-names>
</name>
<etal/>
</person-group>. <article-title>Machine learning models with prognostic implications for predicting gastrointestinal bleeding after coronary artery bypass grafting and guiding personalized medicine: Multicenter cohort study</article-title>. <source>J Med Internet Res</source>. (<year>2025</year>) <volume>27</volume>:<elocation-id>e68509</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.2196/68509</pub-id>, PMID: <pub-id pub-id-type="pmid">40053791</pub-id></citation></ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>J</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>G</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>C</given-names>
</name>
<etal/>
</person-group>. <article-title>Screening risk factors for the occurrence of wedge effects in intramedullary nail fixation for intertrochanteric fractures in older people via machine learning and constructing a prediction model: a retrospective study</article-title>. <source>BMC Musculoskelet Disord</source>. (<year>2025</year>) <volume>26</volume>:<fpage>403</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12891-025-08619-7</pub-id>, PMID: <pub-id pub-id-type="pmid">40264104</pub-id></citation></ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qi</surname> <given-names>W</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>S</given-names>
</name>
<name>
<surname>Li</surname> <given-names>C</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>Prediction of postpartum depression in women: development and validation of multiple machine learning models</article-title>. <source>J Transl Med</source>. (<year>2025</year>) <volume>23</volume>:<fpage>291</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12967-025-06289-6</pub-id>, PMID: <pub-id pub-id-type="pmid">40055720</pub-id></citation></ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname> <given-names>S</given-names>
</name>
<name>
<surname>Gornitz</surname> <given-names>N</given-names>
</name>
<name>
<surname>Xing</surname> <given-names>EP</given-names>
</name>
<name>
<surname>Heckerman</surname> <given-names>D</given-names>
</name>
<name>
<surname>Lippert</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>Ensembles of lasso screening rules</article-title>. <source>IEEE Trans Pattern Anal Mach Intell</source>. (<year>2018</year>) <volume>40</volume>:<page-range>2841&#x2013;52</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/tpami.2017.2765321</pub-id>, PMID: <pub-id pub-id-type="pmid">29989981</pub-id></citation></ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Saoud</surname> <given-names>C</given-names>
</name>
<name>
<surname>Bailey</surname> <given-names>GE</given-names>
</name>
<name>
<surname>Graham</surname> <given-names>AJ</given-names>
</name>
<name>
<surname>Maleki</surname> <given-names>Z</given-names>
</name>
</person-group>. <article-title>The Bethesda system for reporting thyroid cytopathology in the African American population: A tertiary centre experience</article-title>. <source>Cytopathology</source>. (<year>2024</year>) <volume>35</volume>:<page-range>715&#x2013;23</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/cyt.13426</pub-id>, PMID: <pub-id pub-id-type="pmid">39075743</pub-id></citation></ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Allen</surname> <given-names>L</given-names>
</name>
<name>
<surname>Al Afif</surname> <given-names>A</given-names>
</name>
<name>
<surname>Rigby</surname> <given-names>MH</given-names>
</name>
<name>
<surname>Bullock</surname> <given-names>MJ</given-names>
</name>
<name>
<surname>Trites</surname> <given-names>J</given-names>
</name>
<name>
<surname>Taylor</surname> <given-names>SM</given-names>
</name>
<etal/>
</person-group>. <article-title>The role of repeat fine needle aspiration in managing indeterminate thyroid nodules</article-title>. <source>J Otolaryngol Head Neck Surg</source>. (<year>2019</year>) <volume>48</volume>:<fpage>16</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s40463-019-0338-7</pub-id>, PMID: <pub-id pub-id-type="pmid">30894222</pub-id></citation></ref>
<ref id="B35">
<label>35</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Papazian</surname> <given-names>MR</given-names>
</name>
<name>
<surname>Dublin</surname> <given-names>JC</given-names>
</name>
<name>
<surname>Patel</surname> <given-names>KN</given-names>
</name>
<name>
<surname>Oweity</surname> <given-names>T</given-names>
</name>
<name>
<surname>Jacobson</surname> <given-names>AS</given-names>
</name>
<name>
<surname>Brandler</surname> <given-names>TC</given-names>
</name>
<etal/>
</person-group>. <article-title>Repeat fine-needle aspiration with molecular analysis in management of indeterminate thyroid nodules</article-title>. <source>Otolaryngol Head Neck Surg</source>. (<year>2023</year>) <volume>168</volume>:<page-range>738&#x2013;44</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/01945998221093527</pub-id>, PMID: <pub-id pub-id-type="pmid">35412868</pub-id></citation></ref>
<ref id="B36">
<label>36</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ahmadi</surname> <given-names>S</given-names>
</name>
<name>
<surname>Kotwal</surname> <given-names>A</given-names>
</name>
<name>
<surname>Bikas</surname> <given-names>A</given-names>
</name>
<name>
<surname>Xiang</surname> <given-names>P</given-names>
</name>
<name>
<surname>Goldner</surname> <given-names>W</given-names>
</name>
<name>
<surname>Patel</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Outcomes of cytologically indeterminate thyroid nodules managed with genomic sequencing classifier</article-title>. <source>J Clin Endocrinol Metab</source>. (<year>2024</year>) <volume>109</volume>:<page-range>e2231&#x2013;39</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1210/clinem/dgae112</pub-id>, PMID: <pub-id pub-id-type="pmid">38415829</pub-id></citation></ref>
<ref id="B37">
<label>37</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Steward</surname> <given-names>DL</given-names>
</name>
<name>
<surname>Carty</surname> <given-names>SE</given-names>
</name>
<name>
<surname>Sippel</surname> <given-names>RS</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>SP</given-names>
</name>
<name>
<surname>Sosa</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Sipos</surname> <given-names>JA</given-names>
</name>
<etal/>
</person-group>. <article-title>Performance of a multigene genomic classifier in thyroid nodules with indeterminate cytology: A prospective blinded multicenter study</article-title>. <source>JAMA Oncol</source>. (<year>2019</year>) <volume>5</volume>:<page-range>204&#x2013;12</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1001/jamaoncol.2018.4616</pub-id>, PMID: <pub-id pub-id-type="pmid">30419129</pub-id></citation></ref>
<ref id="B38">
<label>38</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shrestha</surname> <given-names>RT</given-names>
</name>
<name>
<surname>Evasovich</surname> <given-names>MR</given-names>
</name>
<name>
<surname>Amin</surname> <given-names>K</given-names>
</name>
<name>
<surname>Radulescu</surname> <given-names>A</given-names>
</name>
<name>
<surname>Sanghvi</surname> <given-names>TS</given-names>
</name>
<name>
<surname>Nelson</surname> <given-names>AC</given-names>
</name>
<etal/>
</person-group>. <article-title>Correlation between histological diagnosis and mutational panel testing of thyroid nodules: A two-year institutional experience</article-title>. <source>Thyroid</source>. (<year>2016</year>) <volume>26</volume>:<page-range>1068&#x2013;76</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1089/thy.2016.0048</pub-id>, PMID: <pub-id pub-id-type="pmid">27283257</pub-id></citation></ref>
<ref id="B39">
<label>39</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lei</surname> <given-names>L</given-names>
</name>
<name>
<surname>Hong Qing</surname> <given-names>S</given-names>
</name>
<name>
<surname>Wei</surname> <given-names>L</given-names>
</name>
<name>
<surname>Ma Mo Yang</surname> <given-names>F</given-names>
</name>
<name>
<surname>Xiao Xiang</surname> <given-names>Y</given-names>
</name>
</person-group>. <article-title>The combined use of fine-needle aspiration (FNA) and BRAF V600E gene testing: Can it increase the definitive diagnosis rate of nodules categorized as Bethesda III for papillary thyroid carcinoma</article-title>? <source>Am Surg</source>. (<year>2024</year>) <volume>90</volume>:<page-range>3209&#x2013;15</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/00031348241265143</pub-id>, PMID: <pub-id pub-id-type="pmid">39047144</pub-id></citation></ref>
<ref id="B40">
<label>40</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Paspala</surname> <given-names>A</given-names>
</name>
<name>
<surname>Bompetsi</surname> <given-names>G</given-names>
</name>
<name>
<surname>Paschou</surname> <given-names>SA</given-names>
</name>
<name>
<surname>Charalambopoulos</surname> <given-names>A</given-names>
</name>
<name>
<surname>Pikoulis</surname> <given-names>E</given-names>
</name>
<name>
<surname>Peppa</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>The value of preoperative molecular testing in the management of Bethesda V and Bethesda VI thyroid tumors</article-title>. <source>(Hormones (Athens)</source>. (<year>2025</year>) <volume>24</volume>:<page-range>217&#x2013;29</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s42000-024-00597-0</pub-id>, PMID: <pub-id pub-id-type="pmid">39225945</pub-id></citation></ref>
<ref id="B41">
<label>41</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Oh</surname> <given-names>MY</given-names>
</name>
<name>
<surname>Choi</surname> <given-names>HM</given-names>
</name>
<name>
<surname>Jang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Son</surname> <given-names>H</given-names>
</name>
<name>
<surname>Park</surname> <given-names>SS</given-names>
</name>
<name>
<surname>Song</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Small multi-gene DNA panel can aid in reducing the surgical resection rate and predicting the Malignancy risk of thyroid nodules</article-title>. <source>Endocrinol Metab (Seoul)</source>. (<year>2024</year>) <volume>39</volume>:<page-range>777&#x2013;92</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3803/EnM.2024.2034</pub-id>, PMID: <pub-id pub-id-type="pmid">39397516</pub-id></citation></ref>
<ref id="B42">
<label>42</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alyusuf</surname> <given-names>EY</given-names>
</name>
<name>
<surname>Alhmayin</surname> <given-names>L</given-names>
</name>
<name>
<surname>Albasri</surname> <given-names>E</given-names>
</name>
<name>
<surname>Enani</surname> <given-names>J</given-names>
</name>
<name>
<surname>Altuwaijri</surname> <given-names>H</given-names>
</name>
<name>
<surname>Alsomali</surname> <given-names>N</given-names>
</name>
<etal/>
</person-group>. <article-title>Ultrasonographic predictors of thyroid cancer in Bethesda III and IV thyroid nodules</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2024</year>) <volume>15</volume>:<elocation-id>1326134</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fendo.2024.1326134</pub-id>, PMID: <pub-id pub-id-type="pmid">38405143</pub-id></citation></ref>
<ref id="B43">
<label>43</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>L</given-names>
</name>
<name>
<surname>Shu</surname> <given-names>H</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>W</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X</given-names>
</name>
<etal/>
</person-group>. <article-title>Diagnostic value of thyroid imaging reporting and data system combined with BRAF(V600E) mutation analysis in Bethesda categories III-V thyroid nodules</article-title>. <source>Sci Rep</source>. (<year>2022</year>) <volume>12</volume>:<fpage>5934</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-022-09822-5</pub-id>, PMID: <pub-id pub-id-type="pmid">35395862</pub-id></citation></ref>
<ref id="B44">
<label>44</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jin</surname> <given-names>L</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>C</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>X</given-names>
</name>
<name>
<surname>Li</surname> <given-names>F</given-names>
</name>
<name>
<surname>Lv</surname> <given-names>X</given-names>
</name>
<name>
<surname>Du</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>An algorithm of image heterogeneity with contrast-enhanced ultrasound in differential diagnosis of solid thyroid nodules</article-title>. <source>Ultrasound Med Biol</source>. (<year>2017</year>) <volume>43</volume>:<page-range>104&#x2013;10</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ultrasmedbio.2016.05.011</pub-id>, PMID: <pub-id pub-id-type="pmid">28029495</pub-id></citation></ref>
<ref id="B45">
<label>45</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>J</given-names>
</name>
<name>
<surname>Shin</surname> <given-names>JH</given-names>
</name>
<name>
<surname>Oh</surname> <given-names>YL</given-names>
</name>
<name>
<surname>Hahn</surname> <given-names>SY</given-names>
</name>
<name>
<surname>Park</surname> <given-names>KW</given-names>
</name>
</person-group>. <article-title>Approach to Bethesda System category III thyroid nodules according to US-risk stratification</article-title>. <source>Endocr J</source>. (<year>2022</year>) <volume>69</volume>:<fpage>67</fpage>&#x2013;<lpage>74</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1507/endocrj.EJ21-0300</pub-id>, PMID: <pub-id pub-id-type="pmid">34408101</pub-id></citation></ref>
<ref id="B46">
<label>46</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname> <given-names>S</given-names>
</name>
<name>
<surname>Shin</surname> <given-names>JH</given-names>
</name>
<name>
<surname>Oh</surname> <given-names>YL</given-names>
</name>
<name>
<surname>Hahn</surname> <given-names>SY</given-names>
</name>
</person-group>. <article-title>Subcategorization of Bethesda System category III by ultrasonography</article-title>. <source>Thyroid</source>. (<year>2016</year>) <volume>26</volume>:<page-range>836&#x2013;42</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1089/thy.2015.0637</pub-id>, PMID: <pub-id pub-id-type="pmid">27094511</pub-id></citation></ref>
<ref id="B47">
<label>47</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Papapostolou</surname> <given-names>KD</given-names>
</name>
<name>
<surname>Evangelopoulou</surname> <given-names>CC</given-names>
</name>
<name>
<surname>Ioannidis</surname> <given-names>IA</given-names>
</name>
<name>
<surname>Kassi</surname> <given-names>GN</given-names>
</name>
<name>
<surname>Morfas</surname> <given-names>KS</given-names>
</name>
<name>
<surname>Karaminas</surname> <given-names>NI</given-names>
</name>
<etal/>
</person-group>. <article-title>Taller-than-wide thyroid nodules with microcalcifications are at high risk of Malignancy</article-title>. <source>In Vivo</source>. (<year>2020</year>) <volume>34</volume>:<page-range>2101&#x2013;05</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.21873/invivo.12014</pub-id>, PMID: <pub-id pub-id-type="pmid">32606189</pub-id></citation></ref>
<ref id="B48">
<label>48</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alhajlan</surname> <given-names>M</given-names>
</name>
<name>
<surname>Al-Masabi</surname> <given-names>M</given-names>
</name>
<name>
<surname>Al Mansour</surname> <given-names>M</given-names>
</name>
<name>
<surname>Saihb</surname> <given-names>A</given-names>
</name>
<name>
<surname>AlAyed</surname> <given-names>S</given-names>
</name>
<name>
<surname>Alwadai</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>The accuracy of fine-needle aspiration cytology and ultrasonography in assessing thyroid nodules in correlation with histopathology: A retrospective study</article-title>. <source>Ann Med Surg (Lond)</source>. (<year>2024</year>) <volume>86</volume>:<page-range>7002&#x2013;09</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/ms9.0000000000002676</pub-id>, PMID: <pub-id pub-id-type="pmid">39649848</pub-id></citation></ref>
<ref id="B49">
<label>49</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alden</surname> <given-names>J</given-names>
</name>
<name>
<surname>Lambrou</surname> <given-names>D</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Two-tier subclassification of the Bethesda category III (Atypia of undetermined significance/follicular lesion of undetermined significance) in thyroid cytology</article-title>. <source>Diagn Cytopathol</source>. (<year>2024</year>) <volume>52</volume>:<page-range>156&#x2013;62</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/dc.25261</pub-id>, PMID: <pub-id pub-id-type="pmid">38095097</pub-id></citation></ref>
<ref id="B50">
<label>50</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jin</surname> <given-names>X</given-names>
</name>
<name>
<surname>Jing</surname> <given-names>X</given-names>
</name>
<name>
<surname>Smola</surname> <given-names>B</given-names>
</name>
<name>
<surname>Heider</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Malignant risk of pediatric Bethesda category III thyroid nodules subcategorized by nuclear atypia and other: A single institution experience</article-title>. <source>Cancer Cytopathol</source>. (<year>2024</year>) <volume>132</volume>:<page-range>564&#x2013;68</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/cncy.22831</pub-id>, PMID: <pub-id pub-id-type="pmid">38771850</pub-id></citation></ref>
<ref id="B51">
<label>51</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bagis</surname> <given-names>M</given-names>
</name>
<name>
<surname>Can</surname> <given-names>N</given-names>
</name>
<name>
<surname>Sut</surname> <given-names>N</given-names>
</name>
<name>
<surname>Tastekin</surname> <given-names>E</given-names>
</name>
<name>
<surname>Erdogan</surname> <given-names>EG</given-names>
</name>
<name>
<surname>Bulbul</surname> <given-names>BY</given-names>
</name>
<etal/>
</person-group>. <article-title>A comprehensive approach to the thyroid Bethesda category III (AUS) in the transition zone between 2nd edition and 3rd edition of the Bethesda System for Reporting Thyroid Cytopathology: Subcategorization, nuclear scoring, and more</article-title>. <source>Endocr Pathol</source>. (<year>2024</year>) <volume>35</volume>:<fpage>51</fpage>&#x2013;<lpage>76</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12022-024-09797-1</pub-id>, PMID: <pub-id pub-id-type="pmid">38280141</pub-id></citation></ref>
<ref id="B52">
<label>52</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jia</surname> <given-names>X</given-names>
</name>
<name>
<surname>Pang</surname> <given-names>P</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>L</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>L</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>L</given-names>
</name>
<name>
<surname>Song</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Clinical analysis of preoperative anti-thyroglobulin antibody in papillary thyroid cancer between 2011 and 2015 in Beijing, China: A retrospective study</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2020</year>) <volume>11</volume>:<elocation-id>452</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fendo.2020.00452</pub-id>, PMID: <pub-id pub-id-type="pmid">32760349</pub-id></citation></ref>
<ref id="B53">
<label>53</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goecks</surname> <given-names>J</given-names>
</name>
<name>
<surname>Jalili</surname> <given-names>V</given-names>
</name>
<name>
<surname>Heiser</surname> <given-names>LM</given-names>
</name>
<name>
<surname>Gray</surname> <given-names>JW</given-names>
</name>
</person-group>. <article-title>How machine learning will transform biomedicine</article-title>. <source>Cell</source>. (<year>2020</year>) <volume>181</volume>:<fpage>92</fpage>&#x2013;<lpage>101</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cell.2020.03.022</pub-id>, PMID: <pub-id pub-id-type="pmid">32243801</pub-id></citation></ref>
<ref id="B54">
<label>54</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Motamedi</surname> <given-names>F</given-names>
</name>
<name>
<surname>P&#xe9;rez-S&#xe1;nchez</surname> <given-names>H</given-names>
</name>
<name>
<surname>Mehridehnavi</surname> <given-names>A</given-names>
</name>
<name>
<surname>Fassihi</surname> <given-names>A</given-names>
</name>
<name>
<surname>Ghasemi</surname> <given-names>F</given-names>
</name>
</person-group>. <article-title>Accelerating big data analysis through lasso-random forest algorithm in QSAR studies</article-title>. <source>Bioinformatics</source>. (<year>2022</year>) <volume>38</volume>:<page-range>469&#x2013;75</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btab659</pub-id>, PMID: <pub-id pub-id-type="pmid">34979024</pub-id></citation></ref>
<ref id="B55">
<label>55</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goin</surname> <given-names>JE</given-names>
</name>
</person-group>. <article-title>Classification bias of the k-nearest neighbor algorithm</article-title>. <source>IEEE Trans Pattern Anal Mach Intell</source>. (<year>1984</year>) <volume>6</volume>:<page-range>379&#x2013;81</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/tpami.1984.4767533</pub-id>, PMID: <pub-id pub-id-type="pmid">21869207</pub-id></citation></ref>
<ref id="B56">
<label>56</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rezvani</surname> <given-names>S</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Handling multi-class problem by intuitionistic fuzzy twin support vector machines based on relative density information</article-title>. <source>IEEE Trans Pattern Anal Mach Intell</source>. (<year>2023</year>) <volume>45</volume>:<page-range>14653&#x2013;64</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/tpami.2023.3310908</pub-id>, PMID: <pub-id pub-id-type="pmid">37651498</pub-id></citation></ref>
<ref id="B57">
<label>57</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname> <given-names>W</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z</given-names>
</name>
</person-group>. <article-title>Comparison of machine learning algorithms and nomogram construction for diabetic retinopathy prediction in type 2 diabetes mellitus patients</article-title>. <source>Ophthalmic Res</source>. (<year>2024</year>) <volume>67</volume>:<page-range>537&#x2013;48</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1159/000541294</pub-id>, PMID: <pub-id pub-id-type="pmid">39231456</pub-id></citation></ref>
<ref id="B58">
<label>58</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Christodoulou</surname> <given-names>E</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>J</given-names>
</name>
<name>
<surname>Collins</surname> <given-names>GS</given-names>
</name>
<name>
<surname>Steyerberg</surname> <given-names>EW</given-names>
</name>
<name>
<surname>Verbakel</surname> <given-names>JY</given-names>
</name>
<name>
<surname>Van Calster</surname> <given-names>B</given-names>
</name>
</person-group>. <article-title>A systematic review shows no performance benefit of machine learning over logistic regression for clinical prediction models</article-title>. <source>J Clin Epidemiol</source>. (<year>2019</year>) <volume>110</volume>:<fpage>12</fpage>&#x2013;<lpage>22</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jclinepi.2019.02.004</pub-id>, PMID: <pub-id pub-id-type="pmid">30763612</pub-id></citation></ref>
<ref id="B59">
<label>59</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>&#xd6;cal</surname> <given-names>B</given-names>
</name>
<name>
<surname>Korkmaz</surname> <given-names>MH</given-names>
</name>
<name>
<surname>Y&#x131;lmazer</surname> <given-names>D</given-names>
</name>
<name>
<surname>Ta&#x15f;k&#x131;n T&#xfc;rkmeno&#x11f;lu</surname> <given-names>T</given-names>
</name>
<name>
<surname>Bay&#x131;r</surname> <given-names>&#xd6;</given-names>
</name>
<name>
<surname>&#xc7;adall&#x131; Tatar</surname> <given-names>E</given-names>
</name>
<etal/>
</person-group>. <article-title>The Malignancy risk assessment of cytologically indeterminate thyroid nodules improves markedly by using a predictive model</article-title>. <source>Eur Thyroid J</source>. (<year>2019</year>) <volume>8</volume>:<page-range>83&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1159/000494720</pub-id>, PMID: <pub-id pub-id-type="pmid">31192147</pub-id></citation></ref>
</ref-list>
</back>
</article>