<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Surg.</journal-id>
<journal-title>Frontiers in Surgery</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Surg.</abbrev-journal-title>
<issn pub-type="epub">2296-875X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fsurg.2023.1095545</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Surgery</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>A machine learning-based model for predicting the risk of early-stage inguinal lymph node metastases in patients with squamous cell carcinoma of the penis</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author"><name><surname>Ding</surname><given-names>Li</given-names></name>
<xref ref-type="author-notes" rid="an1"><sup>&#x2020;</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/1668373/overview"/></contrib>
<contrib contrib-type="author"><name><surname>Zhang</surname><given-names>Chi</given-names></name>
<xref ref-type="author-notes" rid="an1"><sup>&#x2020;</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/1760275/overview" /></contrib>
<contrib contrib-type="author"><name><surname>Wang</surname><given-names>Kun</given-names></name><uri xlink:href="https://loop.frontiersin.org/people/1756169/overview" /></contrib>
<contrib contrib-type="author"><name><surname>Zhang</surname><given-names>Yang</given-names></name><uri xlink:href="https://loop.frontiersin.org/people/1613128/overview" /></contrib>
<contrib contrib-type="author"><name><surname>Wu</surname><given-names>Chuang</given-names></name><uri xlink:href="https://loop.frontiersin.org/people/1846354/overview" /></contrib>
<contrib contrib-type="author"><name><surname>Xia</surname><given-names>Wentao</given-names></name>
<uri xlink:href="https://loop.frontiersin.org/people/1994405/overview" /></contrib>
<contrib contrib-type="author"><name><surname>Li</surname><given-names>Shuaishuai</given-names></name><uri xlink:href="https://loop.frontiersin.org/people/1750518/overview" /></contrib>
<contrib contrib-type="author" corresp="yes"><name><surname>Li</surname><given-names>Wang</given-names></name>
<xref ref-type="corresp" rid="cor1">&#x002A;</xref></contrib>
<contrib contrib-type="author" corresp="yes"><name><surname>Wang</surname><given-names>Junqi</given-names></name>
<xref ref-type="corresp" rid="cor1">&#x002A;</xref></contrib>
</contrib-group>
<aff><addr-line>Department of Urology</addr-line>, <institution>the Affiliated Hospital of Xuzhou Medical University</institution>, <addr-line>Xuzhou</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p><bold>Edited by:</bold> Alessio G. Morganti, University of Bologna, Italy</p></fn>
<fn fn-type="edited-by"><p><bold>Reviewed by:</bold> Andrey O Morozov, I.M. Sechenov First Moscow State Medical University, Russia Jiaheng Xie, Nanjing Medical University, China Wencai Liu, The First Affiliated Hospital of Nanchang University, China</p></fn>
<corresp id="cor1"><label>&#x002A;</label><bold>Correspondence:</bold> Wang Li <email>lizhixin88mm@163.com</email> Junqi Wang <email>wjq68@sina.cn</email></corresp>
<fn id="an1"><label><sup>&#x2020;</sup></label><p>These authors share first authorship</p></fn>
<fn fn-type="other" id="fn001"><p><bold>Specialty Section:</bold> This article was submitted to Genitourinary Surgery, a section of the journal Frontiers in Surgery</p></fn>
</author-notes>
<pub-date pub-type="epub"><day>17</day><month>03</month><year>2023</year></pub-date>
<pub-date pub-type="collection"><year>2023</year></pub-date>
<volume>10</volume><elocation-id>1095545</elocation-id>
<history>
<date date-type="received"><day>11</day><month>11</month><year>2022</year></date>
<date date-type="accepted"><day>07</day><month>02</month><year>2023</year></date>
</history>
<permissions>
<copyright-statement>&#x00A9; 2023 Ding, Zhang, Wang, Zhang, Wu, Xia, Li, Li and Wang.</copyright-statement>
<copyright-year>2023</copyright-year><copyright-holder>Ding, Zhang, Wang, Zhang, Wu, Wentao, Li, Li and Wang</copyright-holder><license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<sec><title>Objective</title>
<p>Inguinal lymph node metastasis (ILNM) is significantly associated with poor prognosis in patients with squamous cell carcinoma of the penis (SCCP). Patient prognosis could be improved if the probability of ILNM incidence could be accurately predicted at an early stage. We developed a predictive model based on machine learning combined with big data to achieve this.</p>
</sec>
<sec><title>Methods</title>
<p>Data of patients diagnosed with SCCP were obtained from the Surveillance, Epidemiology, and End Results Program Research Data. By combing variables that represented the patients&#x0027; clinical characteristics, we applied five machine learning algorithms to create predictive models based on logistic regression, eXtreme Gradient Boosting, Random Forest, Support Vector Machine, and k-Nearest Neighbor. Model performance was evaluated by ten-fold cross-validation receiver operating characteristic curves, which were used to calculate the area under the curve of the five models for predictive accuracy. Decision curve analysis was conducted to estimate the clinical utility of the models. An external validation cohort of 74 SCCP patients was selected from the Affiliated Hospital of Xuzhou Medical University (February 2008 to March 2021).</p>
</sec>
<sec><title>Results</title>
<p>A total of 1,056 patients with SCCP from the SEER database were enrolled as the training cohort, of which 164 (15.5&#x0025;) developed early-stage ILNM. In the external validation cohort, 16.2&#x0025; of patients developed early-stage ILNM. Multivariate logistic regression showed that tumor grade, inguinal lymph node dissection, radiotherapy, and chemotherapy were independent predictors of early-stage ILNM risk. The model based on the eXtreme Gradient Boosting algorithm showed stable and efficient prediction performance in both the training and external validation groups.</p>
</sec>
<sec><title>Conclusion</title>
<p>The ML model based on the XGB algorithm has high predictive effectiveness and may be used to predict early-stage ILNM risk in SCCP patients. Therefore, it may show promise in clinical decision-making.</p>
</sec>
</abstract>
<kwd-group>
<kwd>machine learning algorithms</kwd>
<kwd>prediction model</kwd>
<kwd>penis cancer</kwd>
<kwd>squamous cell carcinoma</kwd>
<kwd>inguinal lymph node metastases</kwd>
<kwd>real-world research</kwd>
</kwd-group>
<contract-num rid="cn001">XWRCHT20210027</contract-num>
<contract-sponsor id="cn001">Xuzhou Medical Leading Talents Training Project</contract-sponsor>
<counts>
<fig-count count="5"/>
<table-count count="3"/><equation-count count="0"/><ref-count count="34"/><page-count count="0"/><word-count count="0"/></counts>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro"><title>Introduction</title>
<p>Penile carcinoma (PC) is a rare malignant tumor of the genitourinary system that exhibits a predilection for the glans and inner prepuce (<xref ref-type="bibr" rid="B1">1</xref>). The overall incidence of PC in men in developed countries such as Europe and the United States is less than 1 in 100,000, and it accounts for approximately 0.24&#x0025; of all new cancer cases in men (<xref ref-type="bibr" rid="B2">2</xref>, <xref ref-type="bibr" rid="B3">3</xref>). In contrast, PC accounts for 2&#x0025; of malignancies in men in less developed countries or regions such as Africa and South America, and in some places like Uganda, the incidence is even higher than 8/100,000 (<xref ref-type="bibr" rid="B4">4</xref>, <xref ref-type="bibr" rid="B5">5</xref>). This phenomenon could be linked to risk factors such as poor economic conditions, a high prevalence of HPV infection, and phimosis (<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B7">7</xref>). Squamous cell carcinoma accounts for more than 95&#x0025; of penile cancers and is the most common histologic type (<xref ref-type="bibr" rid="B8">8</xref>). The risk of developing squamous cell carcinoma of the penis (SCCP) increases with age, with the peak age range being 50 to 70 years (<xref ref-type="bibr" rid="B9">9</xref>). For the surgical treatment of SCCP, the aim of primary tumor treatment is to completely remove the tumor and preserve as many organs as possible without compromising control of the tumor. However, for advanced invasive tumors, partial or radical penectomy is unavoidable (<xref ref-type="bibr" rid="B10">10</xref>).</p>
<p>Lymph node invasion of SCCP conforms to the anatomy, and it most commonly metastasizes to the inguinal lymph nodes, followed by the pelvic lymph nodes. Superficial and deep inguinal lymph nodes are the first regional lymph nodes to be invaded, most commonly in the superior medial region, either unilaterally or bilaterally (<xref ref-type="bibr" rid="B11">11</xref>). Previous studies have shown that the occurrence of lymph node metastases in SCCP patients is significantly associated with poor prognosis (<xref ref-type="bibr" rid="B12">12</xref>). The survival rate of patients with SCCP decreases dramatically with increase in lymph node invasion. The five-year survival rate of patients with inguinal lymph node metastasis (ILNM) is only 50&#x0025;&#x2013;80&#x0025;, but the five-year survival rate of patients who develop pelvic lymph node and peripheral lymph node invasion is less than 33&#x0025; (<xref ref-type="bibr" rid="B13">13</xref>, <xref ref-type="bibr" rid="B14">14</xref>). Due to limitations in imaging techniques, up to 25&#x0025; of cases in patients with clinically negative lymph nodes cannot be detected despite the presence of micrometastases (<xref ref-type="bibr" rid="B15">15</xref>). Therefore, identifying independent risk factors for the development of ILNM at an early stage and establishing corresponding risk prediction models for identifying patients at high risk of ILNM can improve the survival prognosis of this group of SCCP patients through more frequent imaging and more comprehensive clinical treatment in the early stage of diagnosis.</p>
<p>Early studies had shown that stage and grade of the tumor as well as lymphatic and vascular embolization were associated with the risk of lymph node metastasis (<xref ref-type="bibr" rid="B16">16</xref>, <xref ref-type="bibr" rid="B17">17</xref>). Ficarra et al. showed that pT stage, histologic grade, venous embolization, and lymphatic embolization were independent predictors of lymph node metastasis in SCCP (<xref ref-type="bibr" rid="B18">18</xref>). Peak et al. developed a predictive model based on the clinicopathological characteristics of patients recorded in the National Cancer Database (NCDB), which showed better efficacy in their internal validation (<xref ref-type="bibr" rid="B19">19</xref>). In previous studies, several prediction nomograms were established based on logistic regression. The traditional logistic regression algorithm has some limitations in terms of nonlinear complex computation, with area under the curve (AUC) both less than 0.8, so this leaves room for further optimization (<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B21">21</xref>). Machine learning (ML) is an advanced algorithmic model that automatically learns and improves performance by identifying complex nonlinear relationships in different patterns, and is considered superior to traditional algorithms (<xref ref-type="bibr" rid="B22">22</xref>). As one of the components of artificial intelligence, ML has been widely used in clinical practice, such as for epidemic prediction (<xref ref-type="bibr" rid="B23">23</xref>, <xref ref-type="bibr" rid="B24">24</xref>), and survival analysis (<xref ref-type="bibr" rid="B25">25</xref>, <xref ref-type="bibr" rid="B26">26</xref>). ML models have also been proposed for the prediction of lymph node metastasis in a variety of malignancies (<xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B28">28</xref>). Based on these promising clinical applications of ML models, the present study aimed to develop and validate a novel ML-based model for predicting the risk of early-stage ILNM in patients with SCCP.</p>
</sec>
<sec id="s2"><title>Materials and methods</title>
<sec id="s2a"><title>Data source and study population</title>
<p>A retrospective cohort design was adopted. Data were obtained from the SEER research database, which covers roughly 27.8&#x0025; of the US population. The SEER database is a comprehensive data source, which is public and identifiably accessible that data analysis is treated as non-human subjects. Therefore no institutional review board approval and informed consent were required. We used the ICD-O-3 site codes C60.0 to C60.8 and histological codes 8,051&#x2013;8,052 and 8,070&#x2013;8,075 to identify SCCP patients. To develop the ideal ML model, several variables were obtained, including survival data, age at diagnosis, race, marital status at diagnosis, primary site, tumor size, tumor grade, surgical procedure, inguinal lymph node dissection (ILND), lymph-vascular invasion (LVI), TNM stage, radiotherapy data, and chemotherapy data. We grouped ethnicity into white, black and other; and marital status into married and other. An external validation set was constructed by collecting data on the same variables from our center based on the same criteria. A flow chart for patient selection from the SEER database is shown in <xref ref-type="sec" rid="s11">Supplementary Figure S1</xref>. Early-stage ILNM was defined as N1 and N2 stage, i.e., unilateral or bilateral untreated ILNM.</p>
</sec>
<sec id="s2b"><title>Statistical analysis</title>
<p>For continuous variables, Student&#x0027;s <italic>t</italic>-test was used for normally distributed data and the Mann Whitney <italic>U</italic>-test was used for non-normally distributed data. The chi-square test was used to analyze categorical data. Categorical variables were one-hot-encoded before incorporated into the ML algorithms.The odds ratio (OR) with 95&#x0025; confidence intervals (CI) was calculated using univariate and multivariate logistic regression analysis. Only two-sided <italic>p</italic>-values &#x003C;0.05 were considered to indicate statistical significance. We used five different ML algorithms to analyze our data: LR, XGB, RF, SVM, and kNN. The model with the highest average AUC was considered as the best algorithm. Furthermore, the ML-based model was tuned to avoid overfitting, and the accuracy of the algorithm was tested using the ten-fold cross-validation method. Detailed packages used in the development of our ML models including XGB 1.2.1, lightGBM 3.2.1, and sklearn 0.22.1. In the RF algorithm, the number of decision trees was set to 100, the maximum tree depth was set to 10, and the maximum number of leaf nodes was set to 50. In the kNN algorithm, the number of leaves was set to 30, and the number of nearest neighbors was set to 5. R 4.1.2 (<ext-link ext-link-type="uri" xlink:href="https://www.r-project.org/">https://www.r-project.org/</ext-link>), Python 3.10 (<ext-link ext-link-type="uri" xlink:href="https://www.python.org/">https://www.python.org/</ext-link>), and SEER&#x002A;Stat (<ext-link ext-link-type="uri" xlink:href="https://seer.cancer.gov/seers">https://seer.cancer.gov/seers</ext-link> tat/) were used in this study.</p>
</sec>
</sec>
<sec id="s3" sec-type="results"><title>Results</title>
<sec id="s3a"><title>Patient characteristics</title>
<p>Baseline data for the training cohort and external validation cohort are provided in <xref ref-type="table" rid="T1">Table&#x00A0;1</xref>. In the training cohort, the variables with <italic>p</italic> values &#x003C;0.05 were age, tumor size, marital status, tumor grade, T-stage, ILND, LVI, radiotherapy, and chemotherapy. Patients who developed early-stage ILNM were younger compared to those with stage N0 ILNM; had undergone ILND; and had larger tumor size, poorer grade, and higher T-stage. Further, a higher proportion of patients with early-stage ILNM had LVI and were receiving radiotherapy/chemotherapy. No statistically significant differences were found in race or primary site. The correlations between the variables chosen as predictors were analyzed and visualized by a heatmap using Spearman&#x0027;s rank correlation coefficient (<xref ref-type="fig" rid="F1">Figure&#x00A0;1</xref>).</p>
<fig id="F1" position="float"><label>Figure 1</label>
<caption><p>The results of Spearman correlation analysis between all the variables. The heat map shows the correlation between SCCP patients&#x2019; clinical and pathological features.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fsurg-10-1095545-g001.tif"/>
</fig>
<table-wrap id="T1" position="float"><label>Table 1</label>
<caption><p>Baseline characteristics of SCCP patients in the SEER database.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Variables</th>
<th valign="top" align="center">Level</th>
<th valign="top" align="center" colspan="3">Training cohort</th>
<th valign="top" align="center" colspan="3">External validation cohort</th>
</tr>
<tr>
<th valign="top" align="center"><italic>&#x00A0;</italic></th>
<th valign="top" align="center"/>
<th valign="top" align="center">N0 (<italic>n</italic>&#x2009;&#x003D;&#x2009;892)</th>
<th valign="top" align="center">N1&#x2013;N2 (<italic>n</italic>&#x2009;&#x003D;&#x2009;164)</th>
<th valign="top" align="center"><italic>p</italic>-value</th>
<th valign="top" align="center">N0 (<italic>n</italic>&#x2009;&#x003D;&#x2009;62)</th>
<th valign="top" align="center">N1&#x2013;N2 (<italic>n</italic>&#x2009;&#x003D;&#x2009;12)</th>
<th valign="top" align="center"><italic>p</italic>-value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top">Age, year [median (IQR)]</td>
<td valign="top">NA</td>
<td valign="top" align="center">67.000 [57.000,75.000]</td>
<td valign="top" align="center">64.000 [52.000,73.000]</td>
<td valign="top" align="center"><bold>0.003</bold></td>
<td valign="top" align="center">64.000 [59.000,74.000]</td>
<td valign="top" align="center">67.000 [51.000,75.000]</td>
<td valign="top" align="center"><bold>0.809</bold></td>
</tr>
<tr>
<td valign="top">Tumor Size, mm [median (IQR)]</td>
<td valign="top">NA</td>
<td valign="top" align="center">27.000 [18.000,39.000]</td>
<td valign="top" align="center">35.000 [25.000,45.000]</td>
<td valign="top" align="center"><bold>&#x003C;0.001</bold></td>
<td valign="top" align="center">32.000 [25.000,40.000]</td>
<td valign="top" align="center">40.000 [30.000,50.000]</td>
<td valign="top" align="center"><bold>0.161</bold></td>
</tr>
<tr>
<td valign="top" align="left" rowspan="3">Race, <italic>n</italic> (&#x0025;)</td>
<td valign="top">White</td>
<td valign="top" align="center">763 (85.538)</td>
<td valign="top" align="center">137 (83.537)</td>
<td valign="top" align="center" rowspan="3"><bold>0.552</bold></td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center" rowspan="3"><bold>/</bold></td>
</tr>
<tr>
<td valign="top">Black</td>
<td valign="top">78 (8.744)</td>
<td valign="top" align="center">14 (8.537)</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
</tr>
<tr>
<td valign="top">Other/Unknown</td>
<td valign="top">51 (5.717)</td>
<td valign="top" align="center">13 (7.927)</td>
<td valign="top" align="center">62 (100.000)</td>
<td valign="top" align="center">12 (100.000)</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="2">Marital status, <italic>n</italic> (&#x0025;)</td>
<td valign="top">Married</td>
<td valign="top" align="center">562 (63.004)</td>
<td valign="top" align="center">84 (51.220)</td>
<td valign="top" align="center" rowspan="2"><bold>0.004</bold></td>
<td valign="top" align="center">60 (96.774)</td>
<td valign="top" align="center">9 (75.000)</td>
<td valign="top" align="center" rowspan="2"><bold>0.006</bold></td>
</tr>
<tr>
<td valign="top">Other status</td>
<td valign="top">330 (36.996)</td>
<td valign="top" align="center">80 (48.780)</td>
<td valign="top" align="center">2 (3.226)</td>
<td valign="top" align="center">3 (25.000)</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="4">Primary site, <italic>n</italic> (&#x0025;)</td>
<td valign="top">Prepuce</td>
<td valign="top" align="center">187 (20.964)</td>
<td valign="top" align="center">23 (14.024)</td>
<td valign="top" align="center" rowspan="4"><bold>0.138</bold></td>
<td valign="top" align="center">6 (9.677)</td>
<td valign="top" align="center">0 (0.000)</td>
<td valign="top" align="center" rowspan="4"><bold>/</bold></td>
</tr>
<tr>
<td valign="top">Glans penis</td>
<td valign="top">565 (63.341)</td>
<td valign="top" align="center">109 (66.463)</td>
<td valign="top" align="center">25 (40.323)</td>
<td valign="top" align="center">4 (33.333)</td>
</tr>
<tr>
<td valign="top">Body of penis</td>
<td valign="top">72 (8.072)</td>
<td valign="top" align="center">14 (8.537)</td>
<td valign="top" align="center">28 (45.161)</td>
<td valign="top" align="center">6 (50.000)</td>
</tr>
<tr>
<td valign="top">Overlapping lesion of penis</td>
<td valign="top">68 (7.623)</td>
<td valign="top" align="center">18 (10.976)</td>
<td valign="top" align="center">3 (4.839)</td>
<td valign="top" align="center">2 (16.667)</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="4">Tumor grade, <italic>n</italic> (&#x0025;)</td>
<td valign="top">Well differentiated</td>
<td valign="top" align="center">300 (33.632)</td>
<td valign="top" align="center">15 (9.146)</td>
<td valign="top" align="center" rowspan="4"><bold>&#x003C;0.001</bold></td>
<td valign="top" align="center">35 (56.452)</td>
<td valign="top" align="center">2 (16.667)</td>
<td valign="top" align="center" rowspan="4"><bold>0.003</bold></td>
</tr>
<tr>
<td valign="top">Moderately differentiated</td>
<td valign="top">438 (49.103)</td>
<td valign="top" align="center">89 (54.268)</td>
<td valign="top" align="center">19 (30.645)</td>
<td valign="top" align="center">3 (25.000)</td>
</tr>
<tr>
<td valign="top">Poorly differentiated</td>
<td valign="top">150 (16.816)</td>
<td valign="top" align="center">59 (35.976)</td>
<td valign="top" align="center">6 (9.677)</td>
<td valign="top" align="center">6 (50.000)</td>
</tr>
<tr>
<td valign="top">Undifferentiated/Anaplastic</td>
<td valign="top">4 (0.448)</td>
<td valign="top" align="center">1 (0.610)</td>
<td valign="top" align="center">2 (3.226)</td>
<td valign="top" align="center">1 (8.333)</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="4">T stage, <italic>n</italic> (&#x0025;)</td>
<td valign="top">Ta-T1</td>
<td valign="top" align="center">506 (56.726)</td>
<td valign="top" align="center">36 (21.951)</td>
<td valign="top" align="center" rowspan="4"><bold>&#x003C;0.001</bold></td>
<td valign="top" align="center">44 (70.968)</td>
<td valign="top" align="center">2 (16.667)</td>
<td valign="top" align="center" rowspan="4"><bold>/</bold></td>
</tr>
<tr>
<td valign="top">T2</td>
<td valign="top">254 (28.475)</td>
<td valign="top" align="center">70 (42.683)</td>
<td valign="top" align="center">15 (24.194)</td>
<td valign="top" align="center">4 (33.333)</td>
</tr>
<tr>
<td valign="top">T3</td>
<td valign="top">128 (14.350)</td>
<td valign="top" align="center">55 (33.537)</td>
<td valign="top" align="center">3 (4.839)</td>
<td valign="top" align="center">4 (33.333)</td>
</tr>
<tr>
<td valign="top">T4</td>
<td valign="top">4 (0.448)</td>
<td valign="top" align="center">3 (1.829)</td>
<td valign="top" align="center">0 (0.000)</td>
<td valign="top" align="center">2 (16.667)</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="2">ILND, <italic>n</italic> (&#x0025;)</td>
<td valign="top">No/Biopsy only</td>
<td valign="top" align="center">755 (84.641)</td>
<td valign="top" align="center">44 (26.829)</td>
<td valign="top" align="center" rowspan="2"><bold>&#x003C;0.001</bold></td>
<td valign="top" align="center">57 (91.935)</td>
<td valign="top" align="center">8 (66.667)</td>
<td valign="top" align="center" rowspan="2"><bold>0.014</bold></td>
</tr>
<tr>
<td valign="top">Yes</td>
<td valign="top">137 (15.359)</td>
<td valign="top" align="center">120 (73.171)</td>
<td valign="top" align="center">5 (8.065)</td>
<td valign="top" align="center">4 (33.333)</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="2">LVI, <italic>n</italic> (&#x0025;)</td>
<td valign="top">Absent/Unknown</td>
<td valign="top" align="center">824 (92.377)</td>
<td valign="top" align="center">123 (75.000)</td>
<td valign="top" align="center" rowspan="2"><bold>&#x003C;0.001</bold></td>
<td valign="top" align="center">58 (93.548)</td>
<td valign="top" align="center">4 (33.333)</td>
<td valign="top" align="center" rowspan="2"><bold>&#x003C;0.001</bold></td>
</tr>
<tr>
<td valign="top">Present</td>
<td valign="top">68 (7.623)</td>
<td valign="top" align="center">41 (25.000)</td>
<td valign="top" align="center">4 (6.452)</td>
<td valign="top" align="center">8 (66.667)</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="2">Radiotherapy, <italic>n</italic> (&#x0025;)</td>
<td valign="top">No/Unknown</td>
<td valign="top" align="center">853 (95.628)</td>
<td valign="top" align="center">127 (77.439)</td>
<td valign="top" align="center" rowspan="2"><bold>&#x003C;0.001</bold></td>
<td valign="top" align="center">52 (83.871)</td>
<td valign="top" align="center">8 (66.667)</td>
<td valign="top" align="center" rowspan="2"><bold>0.164</bold></td>
</tr>
<tr>
<td valign="top">Yes</td>
<td valign="top">39 (4.372)</td>
<td valign="top" align="center">37 (22.561)</td>
<td valign="top" align="center">10 (16.129)</td>
<td valign="top" align="center">4 (33.333)</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="2">Chemotherapy, <italic>n</italic> (&#x0025;)</td>
<td valign="top">No/Unknown</td>
<td valign="top" align="center">870 (97.534)</td>
<td valign="top" align="center">112 (68.293)</td>
<td valign="top" align="center" rowspan="2"><bold>&#x003C;0.001</bold></td>
<td valign="top" align="center">58 (93.548)</td>
<td valign="top" align="center">9 (75.000)</td>
<td valign="top" align="center" rowspan="2"><bold>0.044</bold></td>
</tr>
<tr>
<td valign="top">Yes</td>
<td valign="top">22 (2.466)</td>
<td valign="top" align="center">52 (31.707)</td>
<td valign="top" align="center">4 (6.452)</td>
<td valign="top" align="center">3 (25.000)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="table-fn1"><p>ILND, Inguinal lymph node dissection; LVI, Lymph-vascular invasion, Other status including single, divorced, separated, divorced and unknown.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3b"><title>Survival analysis</title>
<p>We retrieved patients&#x0027; survival data from the SEER database. Cancer-specific survival (CSS) was considered as the endpoint, and Kaplan-Meier survival analysis was used to estimate the survival. As shown in <xref ref-type="fig" rid="F2">Figure&#x00A0;2</xref>, patients with early-stage ILNM had significantly worse CSS (<italic>p</italic>&#x2009;&#x003C;&#x2009;0.0001).</p>
<fig id="F2" position="float"><label>Figure 2</label>
<caption><p>Kaplan-Meier curve of cancer-specific survival in SCCP patients.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fsurg-10-1095545-g002.tif"/>
</fig>
</sec>
<sec id="s3c"><title>Univariate and multivariate logistic regression analyses</title>
<p>As illustrated in <xref ref-type="table" rid="T2">Table&#x00A0;2</xref>, univariate logistic regression analysis showed that age, marital status, tumor grade, T-stage, ILND, LVI, radiotherapy, and chemotherapy were all significantly associated with the occurrence of early-stage ILNM in the overall population (<italic>p</italic>&#x2009;&#x003C;&#x2009;0.05). In multivariable logistic regression analysis, the factors with statistical significance included tumor grade (<italic>p</italic>&#x2009;&#x003D;&#x2009;0.001), T stage (<italic>p</italic>&#x2009;&#x003D;&#x2009;0.05), ILND (OR&#x2009;&#x003D;&#x2009;11.044, 95&#x0025; CI&#x2009;&#x003D;&#x2009;6.984&#x2013;17.846, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001), radiotherapy (OR&#x2009;&#x003D;&#x2009;4.64, 95&#x0025; CI&#x2009;&#x003D;&#x2009;2.361&#x2013;9.145, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001), and chemotherapy (OR&#x2009;&#x003D;&#x2009;9.612, 95&#x0025; CI&#x2009;&#x003D;&#x2009;4.971&#x2013;19.138, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001).</p>
<table-wrap id="T2" position="float"><label>Table 2</label>
<caption><p>Univariable and multivariate logistic regression analysis of the training cohort for predicting ILNM risk.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Variables</th>
<th valign="top" align="center">Level</th>
<th valign="top" align="center">Univariate OR</th>
<th valign="top" align="center">95&#x0025;CI</th>
<th valign="top" align="center"><italic>p</italic>-value</th>
<th valign="top" align="center">Multivariate OR</th>
<th valign="top" align="center">95&#x0025;CI</th>
<th valign="top" align="center"><italic>p</italic>-value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Age</td>
<td valign="top" align="left">NA</td>
<td valign="top" align="center">0.98</td>
<td valign="top" align="center">[0.967,0.992]</td>
<td valign="top" align="center"><bold>0.001</bold></td>
<td valign="top" align="center">0.997</td>
<td valign="top" align="center">[0.98,1.014]</td>
<td valign="top" align="center">0.704</td>
</tr>
<tr>
<td valign="top" align="left">Tumor size</td>
<td valign="top" align="left">NA</td>
<td valign="top" align="center">1.002</td>
<td valign="top" align="center">[1.000,1.004]</td>
<td valign="top" align="center">0.083</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="3">Race</td>
<td valign="top" align="left">White</td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0.555</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
</tr>
<tr>
<td valign="top" align="left">Black</td>
<td valign="top" align="left">1</td>
<td valign="top" align="center">[0.550,1.816]</td>
<td valign="top" align="center">0.999</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
</tr>
<tr>
<td valign="top" align="left">Other/Unknown</td>
<td valign="top" align="left">1.42</td>
<td valign="top" align="center">[0.752,2.680]</td>
<td valign="top" align="center">0.28</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="2">Marital status</td>
<td valign="top" align="left">Married</td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center"><bold>0.005</bold></td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0.08</td>
</tr>
<tr>
<td valign="top" align="left">Other status</td>
<td valign="top" align="left">1.622</td>
<td valign="top" align="center">[1.160,2.267]</td>
<td valign="top" align="center"/>
<td valign="top" align="center">1.481</td>
<td valign="top" align="center">[0.953,2.304]</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left" rowspan="4">Primary site</td>
<td valign="top" align="left">Prepuce</td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0.144</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
</tr>
<tr>
<td valign="top" align="left">Glans penis</td>
<td valign="top" align="left">1.569</td>
<td valign="top" align="center">[0.971,2.533]</td>
<td valign="top" align="center">0.066</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
</tr>
<tr>
<td valign="top" align="left">Body of penis</td>
<td valign="top" align="left">1.581</td>
<td valign="top" align="center">[0.771,3.241]</td>
<td valign="top" align="center">0.211</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
</tr>
<tr>
<td valign="top" align="left">Overlapping lesion of penis</td>
<td valign="top" align="left">2.152</td>
<td valign="top" align="center">[1.094,4.233]</td>
<td valign="top" align="center">0.026</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
<td valign="top" align="center">/</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="4">Tumor grade</td>
<td valign="top" align="left">Well differentiated</td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center"><bold>&#x003C;0.001</bold></td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center"><bold>0.001</bold></td>
</tr>
<tr>
<td valign="top" align="left">Moderately differentiated</td>
<td valign="top" align="left">4.064</td>
<td valign="top" align="center">[2.306,7.160]</td>
<td valign="top" align="center">&#x003C;0.001</td>
<td valign="top" align="center">3.057</td>
<td valign="top" align="center">[1.577,6.339]</td>
<td valign="top" align="center">0.002</td>
</tr>
<tr>
<td valign="top" align="left">Poorly differentiated</td>
<td valign="top" align="left">7.867</td>
<td valign="top" align="center">[4.319,14.329]</td>
<td valign="top" align="center">&#x003C;0.001</td>
<td valign="top" align="center">4.523</td>
<td valign="top" align="center">[2.197,9.83]</td>
<td valign="top" align="center">&#x003C;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Undifferentiated/Anaplastic</td>
<td valign="top" align="left">5</td>
<td valign="top" align="center">[0.526,47.525]</td>
<td valign="top" align="center">0.161</td>
<td valign="top" align="center">8.396</td>
<td valign="top" align="center">[0.277,105.622]</td>
<td valign="top" align="center">0.15</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="4">T stage</td>
<td valign="top" align="left">Ta-T1</td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center"><bold>&#x003C;0.001</bold></td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center"><bold>0.05</bold></td>
</tr>
<tr>
<td valign="top" align="left">T2</td>
<td valign="top" align="left">3.874</td>
<td valign="top" align="center">[2.522,5.951]</td>
<td valign="top" align="center">&#x003C;0.001</td>
<td valign="top" align="center">1.651</td>
<td valign="top" align="center">[0.955,2.872]</td>
<td valign="top" align="center">0.073</td>
</tr>
<tr>
<td valign="top" align="left">T3</td>
<td valign="top" align="left">6.039</td>
<td valign="top" align="center">[3.802,9.594]</td>
<td valign="top" align="center">&#x003C;0.001</td>
<td valign="top" align="center">2.199</td>
<td valign="top" align="center">[1.21,4.008]</td>
<td valign="top" align="center">0.01</td>
</tr>
<tr>
<td valign="top" align="left">T4</td>
<td valign="top" align="left">10.542</td>
<td valign="top" align="center">[2.272,48.910]</td>
<td valign="top" align="center">0.003</td>
<td valign="top" align="center">4.64</td>
<td valign="top" align="center">[0.461,41.547]</td>
<td valign="top" align="center">0.183</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="2">ILND</td>
<td valign="top" align="left">No/Biopsy only</td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center" rowspan="2"><bold>&#x003C;0.001</bold></td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center" rowspan="2"><bold>&#x003C;0.001</bold></td>
</tr>
<tr>
<td valign="top" align="left">Yes</td>
<td valign="top" align="left">15.03</td>
<td valign="top" align="center">[10.172,22.209]</td>
<td valign="top" align="center">11.044</td>
<td valign="top" align="center">[6.984,17.846]</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="2">LVI</td>
<td valign="top" align="left">Absent/Unknown</td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center" rowspan="2"><bold>&#x003C;0.001</bold></td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center" rowspan="2">0.078</td>
</tr>
<tr>
<td valign="top" align="left">Present</td>
<td valign="top" align="left">4.039</td>
<td valign="top" align="center">[2.624,6.218]</td>
<td valign="top" align="center">1.689</td>
<td valign="top" align="center">[0.937,3.016]</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="2">Radiotherapy</td>
<td valign="top" align="left">No/Unknown</td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center" rowspan="2"><bold>&#x003C;0.001</bold></td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center" rowspan="2"><bold>&#x003C;0.001</bold></td>
</tr>
<tr>
<td valign="top" align="left">Yes</td>
<td valign="top" align="left">6.372</td>
<td valign="top" align="center">[3.916,10.369]</td>
<td valign="top" align="center">4.64</td>
<td valign="top" align="center">[2.361,9.145]</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="2">Chemotherapy</td>
<td valign="top" align="left">No/Unknown</td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center" rowspan="2"><bold>&#x003C;0.001</bold></td>
<td valign="top" align="center">Ref</td>
<td valign="top" align="center"/>
<td valign="top" align="center" rowspan="2"><bold>&#x003C;0.001</bold></td>
</tr>
<tr>
<td valign="top" align="left">Yes</td>
<td valign="top" align="left">18.36</td>
<td valign="top" align="center">[10.743,31.378]</td>
<td valign="top" align="center">9.612</td>
<td valign="top" align="center">[4.971,19.138]</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="table-fn2"><p>OR, odds ratio; CI, confidence intervals; ILND, Inguinal lymph node dissection; LVI, Lymph-vascular Invasion, Other status including single, divorced, separated, divorced and unknown.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3d"><title>Performance of ML algorithms</title>
<p>To compare the predictive efficiency of the five ML algorithm models, ten-fold cross validation was applied in this study (<xref ref-type="fig" rid="F3">Figure&#x00A0;3</xref>). Both the RF model (AUC&#x2009;&#x003D;&#x2009;0.924, 95&#x0025; CI&#x2009;&#x003D;&#x2009;0.902&#x2013;0.946) and the XGB model (AUC&#x2009;&#x003D;&#x2009;0.922, 95&#x0025; CI&#x2009;&#x003D;&#x2009;0.900&#x2013;0.945) performed well in the prediction of early-stage ILNM risk. The decision curve analysis of models was also subsequently constructed. The confusion matrix for ten-fold cross validation of training cohort is shown in <xref ref-type="table" rid="T3">Table&#x00A0;3</xref>. The learning curves of models in the training cohort are shown in <xref ref-type="sec" rid="s11">Supplementary Figure S2</xref>. For the external validation cohort, as shown in <xref ref-type="fig" rid="F4">Figure&#x00A0;4</xref>, the XGB model showed the best performance among the five algorithms according to receiver operating characteristic curve analysis (AUC&#x2009;&#x003D;&#x2009;0.853, 95&#x0025; CI&#x2009;&#x003D;&#x2009;0.743&#x2013;0.964). Since the XGB model was found to be stable and efficient in both the training and validation groups, we finally chose the XGB model (accuracy&#x2009;&#x003D;&#x2009;0.848, sensitivity&#x2009;&#x003D;&#x2009;0.887, specificity&#x2009;&#x003D;&#x2009;0.837 in the training cohort) as the final prediction model. Our ML algorithm model can be embedded in a web calculator or applet to allow clinicians to assess the risk of ILNM in patients with SCCP.</p>
<fig id="F3" position="float"><label>Figure 3</label>
<caption><p>(<bold>A&#x2013;F</bold>) Ten-fold cross ROC curves of five ML models in the training cohort. LR, logistic regression; XGB, eXtreme gradient boosting; RF, random forest; SVM, support vector machine; KNN, k-nearest neighbor. (<bold>G</bold>) Decision curve analysis graph showing the net benefit against threshold probabilities based on decisions from model outputs. The curves referred to as &#x201C;All&#x201D; represent the prediction that all the patients would progress to ILNM, and the curves referred to as &#x201C;None&#x201D; represent the prediction that no patients were ILNM.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fsurg-10-1095545-g003.tif"/>
</fig>
<fig id="F4" position="float"><label>Figure 4</label>
<caption><p>The ROC curve of five models in the external validation cohort.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fsurg-10-1095545-g004.tif"/>
</fig>
<table-wrap id="T3" position="float"><label>Table 3</label>
<caption><p>Confusion matrix for ten-fold cross validation of training cohort.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left"/>
<th valign="top" align="center">Accuracy</th>
<th valign="top" align="center">Recall</th>
<th valign="top" align="center">Precision</th>
<th valign="top" align="center">F1-Measure</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">XGB</td>
<td valign="top" align="center">0.867</td>
<td valign="top" align="center">0.867</td>
<td valign="top" align="center">0.86</td>
<td valign="top" align="center">0.857</td>
</tr>
<tr>
<td valign="top" align="left">LR</td>
<td valign="top" align="center">0.883</td>
<td valign="top" align="center">0.883</td>
<td valign="top" align="center">0.871</td>
<td valign="top" align="center">0.867</td>
</tr>
<tr>
<td valign="top" align="left">RF</td>
<td valign="top" align="center">0.863</td>
<td valign="top" align="center">0.863</td>
<td valign="top" align="center">0.853</td>
<td valign="top" align="center">0.852</td>
</tr>
<tr>
<td valign="top" align="left">SVM</td>
<td valign="top" align="center">0.873</td>
<td valign="top" align="center">0.873</td>
<td valign="top" align="center">0.859</td>
<td valign="top" align="center">0.851</td>
</tr>
<tr>
<td valign="top" align="left">kNN</td>
<td valign="top" align="center">0.869</td>
<td valign="top" align="center">0.869</td>
<td valign="top" align="center">0.861</td>
<td valign="top" align="center">0.861</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3e"><title>Relative importance of variables</title>
<p>The importance of patient clinical features in the XGB model is shown in <xref ref-type="fig" rid="F5">Figure&#x00A0;5</xref>, and is listed here in descending order of importance: ILND, chemotherapy, radiotherapy, tumor grade, and T stage.</p>
<fig id="F5" position="float"><label>Figure 5</label>
<caption><p>The XGB model was used to calculate the importance of each feature. The bar chart depicts the relative significance of the variables.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fsurg-10-1095545-g005.tif"/>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion"><title>Discussion</title>
<p>The occurrence of ILNM in SCCP is associated with poor patient prognosis. ILND is the most important procedure for the prevention and treatment of ILNM (<xref ref-type="bibr" rid="B29">29</xref>). However, surgeons must consider the balance between the survival benefit to the patient and the high incidence of postoperative complications (<xref ref-type="bibr" rid="B30">30</xref>). The use of dynamic anterior node biopsy has been advocated to avoid unnecessary ILND, but the risk of false-negative results remains unavoidable (<xref ref-type="bibr" rid="B31">31</xref>), thus threatening the postoperative quality of patient survival. Therefore, early and accurate prediction of LNM is imminent. Previous studies on the SEER database suggest that age at diagnosis, tumor grade, tumor size, T stage, primary site, and LVI may be predictors of ILNM. However, these studies did not take into account the postoperative adjuvant therapy received by the patients. The models based on these variables had AUC of 0.776 and 0.795, respectively (<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B21">21</xref>). The advent of ML algorithms has made it possible to improve model performance.</p>
<p>In this study, we included SCCP patients no distant metastases and non-N3 stage, and developed an accurate predictive model for predicting the risk of early-stage ILNM based on multiple clinical and pathological indicators. Our aim is to screen the SCCP population with a high risk of ILNM for more careful perioperative management of this group of patients, with the ultimate goal of improving patient prognosis. To the best of our knowledge, this is the first model based on a variety of ML algorithms to predict early-stage ILNM with big data and performing external validation. This study included 1,056 cases of SCCP from the SEER database for model establishment and 74 cases from an independent institution in China for external validation. We adopted five ML methods: LR, XGB, RF, SVM, and KNN. By integrating the findings related to the effectiveness and stability of the models in the training and external validation groups, we finally identified XGB as the best prediction model algorithm for early-stage ILNM risk prediction. In the training cohort, the XGB algorithm model (AUC&#x2009;&#x003D;&#x2009;0.922, 95&#x0025; CI&#x2009;&#x003D;&#x2009;0.900&#x2013;0.945) showed superior performance and also performed well in the external validation. The model can be embedded as a web calculator or applied by way of a mobile terminal application. By entering the values or classification results of each indicator, the individual risk of progression can be calculated and, for patients at high risk, more aggressive physical examination, imaging, adjuvant therapy or even surgery should be performed postoperatively.</p>
<p>In both the baseline analysis and the univariate regression, a lower proportion of married than unmarried individuals had early-stage ILNM. This might partly be attributable to the fact that married people tend to have better economic conditions and personal hygiene. In addition, having physical intimacy with a partner increases the likelihood of detecting masses in the groin area and visiting a hospital at an earlier stage of the disease. In our study, the site of the primary tumor did not show a significant association with ILNM risk, but this is not consistent with the findings of previous studies (<xref ref-type="bibr" rid="B21">21</xref>). Because delayed intervention can adversely affect the survival of patients with PC diagnosed with lymph node involvement, treatment guidelines recommend lymph node dissection. Therefore, management of regional lymph nodes is very important for patient survival (<xref ref-type="bibr" rid="B32">32</xref>). Our findings indicate the importance of ILND for the detection of early-stage ILNM. LVI is defined as infiltration of tumor cells in the lymphatic or hematologic system. Previous studies have shown that LVI is significantly associated with lymph node metastasis and distant metastasis (<xref ref-type="bibr" rid="B33">33</xref>). Recently, there is evidence that the presence of LVI is an important risk factor for occult micrometastases in patients with penile cancer and affects the overall survival of patients (<xref ref-type="bibr" rid="B34">34</xref>). The correlation of risk with T stage and nuclear grade observed in the present study is in line with previous literature (<xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B34">34</xref>). Meanwhile, patients with indications for radiation and chemotherapy, have a higher risk of developing early ILNM, based on clinician judgment.</p>
<p>Our study has certain limitations. First, the number of patients used for external validation at our center is small, and we hope to further improve it at a later stage through multi-center collaboration. Second, ML algorithms are inconvenient for use in clinical practice, and we hope to develop an online calculator app of our XGB model for clinicians in the future. In addition, there are also some limitations to the data in the SEER database. The lack of data on immunohistochemistry, genomics, patient physical indicators, underlying diseases, and hematological indicators reduces the possibility of improving the accuracy of the model, and we hope to remedy this through the establishment of a multicenter database. In addition, the practical value of the model was determined in a predominantly Caucasian database, so its applicability in other regions (including China) is unclear due to the inevitable differences in ethnicity and treatment levels in different countries/regions. Finally, the indications for ILND or adjuvant therapy vary from one medical center to another, so there may be some errors in its practical application. Nevertheless, our study yielded encouraging results that ML algorithms appear to have greater efficacy potential for early ILNM risk prediction in patients with SCCP compared to traditional logistic regression analysis.</p>
</sec>
<sec id="s5" sec-type="conclusions"><title>Conclusion</title>
<p>We have built a precise, big data-based ML model for predicting early-stage ILNM in patients with SCCP. External validation proved that our novel model has excellent predictive accuracy and clinical utility. Therefore, in the future, it may guide clinicians&#x0027; decisions and improve the long-term prognosis of patients.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability"><title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="s7"><title>Ethics statement</title>
<p>The studies involving human participants were reviewed and approved by the Ethics Committee of the Affiliated Hospital of Xuzhou Medical University. Written informed consent for participation was not required for this study in accordance with the national legislation and the institutional requirements.</p>
</sec>
<sec id="s8"><title>Author contributions</title>
<p>LD,CZ,KW contributed to the idea and design. CZ, KW, YZ collected and analyzed the data. LD, CW, WX, SL drew the figures and tables. LD and CZ wrote the draft. LD, CZ, KW, YZ, CW, WX, SL, WL and JW contributed to manuscript writing and revision. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec id="s9" sec-type="funding-information"><title>Funding</title>
<p>This work was supported by The second round of Xuzhou Medical Leading Talents Training Project (XWRCHT20210027).</p>
</sec>
<sec id="s10" sec-type="COI-statement"><title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s12" sec-type="disclaimer"><title>Publisher&#x0027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material"><title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fsurg.2023.1095545/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fsurg.2023.1095545/full&#x0023;supplementary-material</ext-link>.</p>
<supplementary-material id="SD1" content-type="local-data">
<media mimetype="application" mime-subtype="" xlink:href="Table1.xlsx"/>
</supplementary-material>
<supplementary-material id="SD2" content-type="local-data">
<media mimetype="application" mime-subtype="" xlink:href="Table2.xlsx"/>
</supplementary-material>
<supplementary-material id="SD3" content-type="local-data">
<media mimetype="image" mime-subtype="tiff" xlink:href="Image1.tif"/>
</supplementary-material>
<supplementary-material id="SD4" content-type="local-data">
<media mimetype="image" mime-subtype="tiff" xlink:href="Image2.tif"/>
</supplementary-material>
</sec>
<ref-list><title>References</title>
<ref id="B1"><label>1.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>O&#x0027;Sullivan</surname><given-names>B</given-names></name><name><surname>Brierley</surname><given-names>J</given-names></name><name><surname>Byrd</surname><given-names>D</given-names></name><name><surname>Bosman</surname><given-names>F</given-names></name><name><surname>Kehoe</surname><given-names>S</given-names></name><name><surname>Kossary</surname><given-names>C</given-names></name><etal/></person-group> <article-title>The tnm classification of malignant tumours-towards common understanding and reasonable expectations</article-title>. <source>Lancet Oncol</source>. (<year>2017</year>) <volume>18</volume>:<fpage>849</fpage>&#x2013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.1016/S1470-2045(17)30438-2</pub-id></citation></ref>
<ref id="B2"><label>2.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Siegel</surname><given-names>RL</given-names></name><name><surname>Miller</surname><given-names>KD</given-names></name><name><surname>Jemal</surname><given-names>A</given-names></name></person-group>. <article-title>Cancer statistics, 2019</article-title>. <source>Ca Cancer J Clin</source>. (<year>2019</year>) <volume>69</volume>:<fpage>7</fpage>&#x2013;<lpage>34</lpage>. <pub-id pub-id-type="doi">10.3322/caac.21551</pub-id><pub-id pub-id-type="pmid">30620402</pub-id></citation></ref>
<ref id="B3"><label>3.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bray</surname><given-names>F</given-names></name><name><surname>Klint</surname><given-names>A</given-names></name><name><surname>Gislum</surname><given-names>M</given-names></name><name><surname>Hakulinen</surname><given-names>T</given-names></name><name><surname>Engholm</surname><given-names>G</given-names></name><name><surname>Tryggvadottir</surname><given-names>L</given-names></name><etal/></person-group> <article-title>Trends in survival of patients diagnosed with male genital cancers in the nordic countries 1964-2003 followed up until the end of 2006</article-title>. <source>Acta Oncol</source>. (<year>2010</year>) <volume>49</volume>:<fpage>644</fpage>&#x2013;<lpage>54</lpage>. <pub-id pub-id-type="doi">10.3109/02841860903575315</pub-id><pub-id pub-id-type="pmid">20151937</pub-id></citation></ref>
<ref id="B4"><label>4.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Backes</surname><given-names>DM</given-names></name><name><surname>Kurman</surname><given-names>RJ</given-names></name><name><surname>Pimenta</surname><given-names>JM</given-names></name><name><surname>Smith</surname><given-names>JS</given-names></name></person-group>. <article-title>Systematic review of human papillomavirus prevalence in invasive penile cancer</article-title>. <source>Cancer Causes Control</source>. (<year>2009</year>) <volume>20</volume>:<fpage>449</fpage>&#x2013;<lpage>57</lpage>. <pub-id pub-id-type="doi">10.1007/s10552-008-9276-9</pub-id><pub-id pub-id-type="pmid">19082746</pub-id></citation></ref>
<ref id="B5"><label>5.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Coelho</surname><given-names>R</given-names></name><name><surname>Pinho</surname><given-names>JD</given-names></name><name><surname>Moreno</surname><given-names>JS</given-names></name><name><surname>Garbis</surname><given-names>D</given-names></name><name><surname>Do</surname><given-names>NA</given-names></name><name><surname>Larges</surname><given-names>JS</given-names></name><etal/></person-group> <article-title>Penile cancer in maranhao, northeast Brazil: the highest incidence globally?</article-title> <source>Bmc Urol</source>. (<year>2018</year>) <volume>18</volume>:<fpage>50</fpage>. <pub-id pub-id-type="doi">10.1186/s12894-018-0365-0</pub-id><pub-id pub-id-type="pmid">29843769</pub-id></citation></ref>
<ref id="B6"><label>6.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maden</surname><given-names>C</given-names></name><name><surname>Sherman</surname><given-names>KJ</given-names></name><name><surname>Beckmann</surname><given-names>AM</given-names></name><name><surname>Hislop</surname><given-names>TG</given-names></name><name><surname>Teh</surname><given-names>CZ</given-names></name><name><surname>Ashley</surname><given-names>RL</given-names></name><etal/></person-group> <article-title>History of circumcision, medical conditions, and sexual activity and risk of penile cancer</article-title>. <source>J Natl Cancer Inst</source>. (<year>1993</year>) <volume>85</volume>:<fpage>19</fpage>&#x2013;<lpage>24</lpage>. <pub-id pub-id-type="doi">10.1093/jnci/85.1.19</pub-id><pub-id pub-id-type="pmid">8380060</pub-id></citation></ref>
<ref id="B7"><label>7.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Koifman</surname><given-names>L</given-names></name><name><surname>Vides</surname><given-names>AJ</given-names></name><name><surname>Koifman</surname><given-names>N</given-names></name><name><surname>Carvalho</surname><given-names>JP</given-names></name><name><surname>Ornellas</surname><given-names>AA</given-names></name></person-group>. <article-title>Epidemiological aspects of penile cancer in rio de janeiro: evaluation of 230 cases</article-title>. <source>Int Braz J Urol</source>. (<year>2011</year>) <volume>37</volume>:<fpage>231</fpage>&#x2013;<lpage>40</lpage>, <comment>240-3</comment>. <pub-id pub-id-type="doi">10.1590/s1677-55382011000200010</pub-id><pub-id pub-id-type="pmid">21557840</pub-id></citation></ref>
<ref id="B8"><label>8.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Erbersdobler</surname><given-names>A</given-names></name></person-group>. <article-title>Pathologic evaluation and reporting of carcinoma of the penis</article-title>. <source>Clin Genitourin Cancer</source>. (<year>2017</year>) <volume>15</volume>:<fpage>192</fpage>&#x2013;<lpage>5</lpage>. <pub-id pub-id-type="doi">10.1016/j.clgc.2016.08.003</pub-id><pub-id pub-id-type="pmid">27594553</pub-id></citation></ref>
<ref id="B9"><label>9.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Christodoulidou</surname><given-names>M</given-names></name><name><surname>Sahdev</surname><given-names>V</given-names></name><name><surname>Houssein</surname><given-names>S</given-names></name><name><surname>Muneer</surname><given-names>A</given-names></name></person-group>. <article-title>Epidemiology of penile cancer</article-title>. <source>Curr Probl Cancer</source>. (<year>2015</year>) <volume>39</volume>:<fpage>126</fpage>&#x2013;<lpage>36</lpage>. <pub-id pub-id-type="doi">10.1016/j.currproblcancer.2015.03.010</pub-id><pub-id pub-id-type="pmid">26076979</pub-id></citation></ref>
<ref id="B10"><label>10.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Audenet</surname><given-names>F</given-names></name><name><surname>Sfakianos</surname><given-names>JP</given-names></name></person-group>. <article-title>Psychosocial impact of penile carcinoma</article-title>. <source>Transl Androl Urol</source>. (<year>2017</year>) <volume>6</volume>:<fpage>874</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.21037/tau.2017.07.24</pub-id><pub-id pub-id-type="pmid">29184785</pub-id></citation></ref>
<ref id="B11"><label>11.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Leijte</surname><given-names>JA</given-names></name><name><surname>Kirrander</surname><given-names>P</given-names></name><name><surname>Antonini</surname><given-names>N</given-names></name><name><surname>Windahl</surname><given-names>T</given-names></name><name><surname>Horenblas</surname><given-names>S</given-names></name></person-group>. <article-title>Recurrence patterns of squamous cell carcinoma of the penis: recommendations for follow-up based on a two-centre analysis of 700 patients</article-title>. <source>Eur Urol</source>. (<year>2008</year>) <volume>54</volume>:<fpage>161</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1016/j.eururo.2008.04.016</pub-id><pub-id pub-id-type="pmid">18440124</pub-id></citation></ref>
<ref id="B12"><label>12.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wen</surname><given-names>S</given-names></name><name><surname>Ren</surname><given-names>W</given-names></name><name><surname>Xue</surname><given-names>B</given-names></name><name><surname>Fan</surname><given-names>Y</given-names></name><name><surname>Jiang</surname><given-names>Y</given-names></name><name><surname>Zeng</surname><given-names>C</given-names></name><etal/></person-group> <article-title>Prognostic factors in patients with penile cancer after surgical management</article-title>. <source>World J Urol</source>. (<year>2018</year>) <volume>36</volume>:<fpage>435</fpage>&#x2013;<lpage>40</lpage>. <pub-id pub-id-type="doi">10.1007/s00345-017-2167-5</pub-id><pub-id pub-id-type="pmid">29299663</pub-id></citation></ref>
<ref id="B13"><label>13.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hakenberg</surname><given-names>OW</given-names></name><name><surname>Comperat</surname><given-names>EM</given-names></name><name><surname>Minhas</surname><given-names>S</given-names></name><name><surname>Necchi</surname><given-names>A</given-names></name><name><surname>Protzel</surname><given-names>C</given-names></name><name><surname>Watkin</surname><given-names>N</given-names></name></person-group>. <article-title>Eau guidelines on penile cancer: 2014 update</article-title>. <source>Eur Urol</source>. (<year>2015</year>) <volume>67</volume>:<fpage>142</fpage>&#x2013;<lpage>50</lpage>. <pub-id pub-id-type="doi">10.1016/j.eururo.2014.10.017</pub-id><pub-id pub-id-type="pmid">25457021</pub-id></citation></ref>
<ref id="B14"><label>14.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Srinivas</surname><given-names>V</given-names></name><name><surname>Morse</surname><given-names>MJ</given-names></name><name><surname>Herr</surname><given-names>HW</given-names></name><name><surname>Sogani</surname><given-names>PC</given-names></name><name><surname>Whitmore</surname><given-names>WJ</given-names></name></person-group>. <article-title>Penile cancer: relation of extent of nodal metastasis to survival</article-title>. <source>J Urol</source>. (<year>1987</year>) <volume>137</volume>:<fpage>880</fpage>&#x2013;<lpage>2</lpage>. <pub-id pub-id-type="doi">10.1016/s0022-5347(17)44281-9</pub-id><pub-id pub-id-type="pmid">3573181</pub-id></citation></ref>
<ref id="B15"><label>15.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bandieramonte</surname><given-names>G</given-names></name><name><surname>Colecchia</surname><given-names>M</given-names></name><name><surname>Mariani</surname><given-names>L</given-names></name><name><surname>Lo</surname><given-names>VS</given-names></name><name><surname>Pizzocaro</surname><given-names>G</given-names></name><name><surname>Piva</surname><given-names>L</given-names></name><etal/></person-group> <article-title>Peniscopically controlled co2 laser excision for conservative treatment of in situ and t1 penile carcinoma: report on 224 patients</article-title>. <source>Eur Urol</source>. (<year>2008</year>) <volume>54</volume>:<fpage>875</fpage>&#x2013;<lpage>82</lpage>. <pub-id pub-id-type="doi">10.1016/j.eururo.2008.01.019</pub-id><pub-id pub-id-type="pmid">18243513</pub-id></citation></ref>
<ref id="B16"><label>16.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lopes</surname><given-names>A</given-names></name><name><surname>Hidalgo</surname><given-names>GS</given-names></name><name><surname>Kowalski</surname><given-names>LP</given-names></name><name><surname>Torloni</surname><given-names>H</given-names></name><name><surname>Rossi</surname><given-names>BM</given-names></name><name><surname>Fonseca</surname><given-names>FP</given-names></name></person-group>. <article-title>Prognostic factors in carcinoma of the penis: multivariate analysis of 145 patients treated with amputation and lymphadenectomy</article-title>. <source>J Urol</source>. (<year>1996</year>) <volume>156</volume>:<fpage>1637</fpage>&#x2013;<lpage>42</lpage>. <pub-id pub-id-type="doi">10.1016/s0022-5347(01)65471-5</pub-id><pub-id pub-id-type="pmid">8863559</pub-id></citation></ref>
<ref id="B17"><label>17.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Slaton</surname><given-names>JW</given-names></name><name><surname>Morgenstern</surname><given-names>N</given-names></name><name><surname>Levy</surname><given-names>DA</given-names></name><name><surname>Santos</surname><given-names>MJ</given-names></name><name><surname>Tamboli</surname><given-names>P</given-names></name><name><surname>Ro</surname><given-names>JY</given-names></name><etal/></person-group> <article-title>Tumor stage, vascular invasion and the percentage of poorly differentiated cancer: independent prognosticators for inguinal lymph node metastasis in penile squamous cancer</article-title>. <source>J Urol</source>. (<year>2001</year>) <volume>165</volume>:<fpage>1138</fpage>&#x2013;<lpage>42</lpage>. <pub-id pub-id-type="doi">10.1016/S0022-5347(05)66450-6</pub-id><pub-id pub-id-type="pmid">11257655</pub-id></citation></ref>
<ref id="B18"><label>18.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ficarra</surname><given-names>V</given-names></name><name><surname>Zattoni</surname><given-names>F</given-names></name><name><surname>Cunico</surname><given-names>SC</given-names></name><name><surname>Galetti</surname><given-names>TP</given-names></name><name><surname>Luciani</surname><given-names>L</given-names></name><name><surname>Fandella</surname><given-names>A</given-names></name><etal/></person-group> <article-title>Lymphatic and vascular embolizations are independent predictive variables of inguinal lymph node involvement in patients with squamous cell carcinoma of the penis: gruppo uro-oncologico del nord est (northeast uro-oncological group) penile cancer data base data</article-title>. <source>Cancer</source>. (<year>2005</year>) <volume>103</volume>:<fpage>2507</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.1002/cncr.21076</pub-id><pub-id pub-id-type="pmid">15856474</pub-id></citation></ref>
<ref id="B19"><label>19.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Peak</surname><given-names>TC</given-names></name><name><surname>Russell</surname><given-names>GB</given-names></name><name><surname>Dutta</surname><given-names>R</given-names></name><name><surname>Rothberg</surname><given-names>MB</given-names></name><name><surname>Chapple</surname><given-names>AG</given-names></name><name><surname>Hemal</surname><given-names>AK</given-names></name></person-group>. <article-title>A national cancer database-based nomogram to predict lymph node metastasis in penile cancer</article-title>. <source>Bju Int</source>. (<year>2019</year>) <volume>123</volume>:<fpage>1005</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1111/bju.14652</pub-id><pub-id pub-id-type="pmid">30548161</pub-id></citation></ref>
<ref id="B20"><label>20.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shao</surname><given-names>Y</given-names></name><name><surname>Tu</surname><given-names>X</given-names></name><name><surname>Liu</surname><given-names>Y</given-names></name><name><surname>Bao</surname><given-names>Y</given-names></name><name><surname>Ren</surname><given-names>S</given-names></name><name><surname>Yang</surname><given-names>Z</given-names></name><etal/></person-group> <article-title>Predict lymph node metastasis in penile cancer using clinicopathological factors and nomograms</article-title>. <source>Cancer Manag Res</source>. (<year>2021</year>) <volume>13</volume>:<fpage>7429</fpage>&#x2013;<lpage>37</lpage>. <pub-id pub-id-type="doi">10.2147/CMAR.S329925</pub-id><pub-id pub-id-type="pmid">34594135</pub-id></citation></ref>
<ref id="B21"><label>21.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>W</given-names></name><name><surname>Gao</surname><given-names>P</given-names></name><name><surname>Gao</surname><given-names>J</given-names></name><name><surname>Wu</surname><given-names>X</given-names></name><name><surname>Liu</surname><given-names>G</given-names></name><name><surname>Zhang</surname><given-names>X</given-names></name></person-group>. <article-title>A clinical nomogram for predicting lymph node metastasis in penile cancer: a seer-based study</article-title>. <source>Front Oncol</source>. (<year>2021</year>) <volume>11</volume>:<fpage>640036</fpage>. <pub-id pub-id-type="doi">10.3389/fonc.2021.640036</pub-id><pub-id pub-id-type="pmid">33768001</pub-id></citation></ref>
<ref id="B22"><label>22.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kourou</surname><given-names>K</given-names></name><name><surname>Exarchos</surname><given-names>TP</given-names></name><name><surname>Exarchos</surname><given-names>KP</given-names></name><name><surname>Karamouzis</surname><given-names>MV</given-names></name><name><surname>Fotiadis</surname><given-names>DI</given-names></name></person-group>. <article-title>Machine learning applications in cancer prognosis and prediction</article-title>. <source>Comput Struct Biotechnol J</source>. (<year>2015</year>) <volume>13</volume>:<fpage>8</fpage>&#x2013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.1016/j.csbj.2014.11.005</pub-id><pub-id pub-id-type="pmid">25750696</pub-id></citation></ref>
<ref id="B23"><label>23.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ngabo</surname><given-names>D</given-names></name><name><surname>Dong</surname><given-names>W</given-names></name><name><surname>Ibeke</surname><given-names>E</given-names></name><name><surname>Iwendi</surname><given-names>C</given-names></name><name><surname>Masabo</surname><given-names>E</given-names></name></person-group>. <article-title>Tackling pandemics in smart cities using machine learning architecture</article-title>. <source>Math Biosci Eng</source>. (<year>2021</year>) <volume>18</volume>:<fpage>8444</fpage>&#x2013;<lpage>61</lpage>. <pub-id pub-id-type="doi">10.3934/mbe.2021418</pub-id><pub-id pub-id-type="pmid">34814307</pub-id></citation></ref>
<ref id="B24"><label>24.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Iwendi</surname><given-names>C</given-names></name><name><surname>Huescas</surname><given-names>CGY</given-names></name><name><surname>Chakraborty</surname><given-names>C</given-names></name><name><surname>Mohan</surname><given-names>S</given-names></name></person-group>. <article-title>COVID-19 health analysis and prediction using machine learning algorithms for Mexico and Brazil patients</article-title>. <source>J Exp Theor Artif Intell</source>. (<year>2022</year>) <volume>35</volume>(<issue>12</issue>):<fpage>1226</fpage>&#x2013;<lpage>37.e7</lpage>. <pub-id pub-id-type="doi">10.1080/0952813X.2022.2058097</pub-id></citation></ref>
<ref id="B25"><label>25.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Deo</surname><given-names>RC</given-names></name></person-group>. <article-title>Machine learning in medicine</article-title>. <source>Circulation</source>. (<year>2015</year>) <volume>132</volume>:<fpage>1920</fpage>&#x2013;<lpage>30</lpage>. <pub-id pub-id-type="doi">10.1161/CIRCULATIONAHA.115.001593</pub-id><pub-id pub-id-type="pmid">26572668</pub-id></citation></ref>
<ref id="B26"><label>26.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vougas</surname><given-names>K</given-names></name><name><surname>Sakellaropoulos</surname><given-names>T</given-names></name><name><surname>Kotsinas</surname><given-names>A</given-names></name><name><surname>Foukas</surname><given-names>GP</given-names></name><name><surname>Ntargaras</surname><given-names>A</given-names></name><name><surname>Koinis</surname><given-names>F</given-names></name><etal/></person-group> <article-title>Machine learning and data mining frameworks for predicting drug response in cancer: an overview and a novel in silico screening process based on association rule mining</article-title>. <source>Pharmacol Ther</source>. (<year>2019</year>) <volume>203</volume>:<fpage>107395</fpage>. <pub-id pub-id-type="doi">10.1016/j.pharmthera.2019.107395</pub-id><pub-id pub-id-type="pmid">31374225</pub-id></citation></ref>
<ref id="B27"><label>27.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wei</surname><given-names>L</given-names></name><name><surname>Huang</surname><given-names>Y</given-names></name><name><surname>Chen</surname><given-names>Z</given-names></name><name><surname>Lei</surname><given-names>H</given-names></name><name><surname>Qin</surname><given-names>X</given-names></name><name><surname>Cui</surname><given-names>L</given-names></name><etal/></person-group> <article-title>Artificial intelligence combined with big data to predict lymph node involvement in prostate cancer: a population-based study</article-title>. <source>Front Oncol</source>. (<year>2021</year>) <volume>11</volume>:<fpage>763381</fpage>. <pub-id pub-id-type="doi">10.3389/fonc.2021.763381</pub-id><pub-id pub-id-type="pmid">34722318</pub-id></citation></ref>
<ref id="B28"><label>28.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>W</given-names></name><name><surname>Zhou</surname><given-names>Q</given-names></name><name><surname>Liu</surname><given-names>W</given-names></name><name><surname>Xu</surname><given-names>C</given-names></name><name><surname>Tang</surname><given-names>ZR</given-names></name><name><surname>Dong</surname><given-names>S</given-names></name><etal/></person-group> <article-title>A machine learning-based predictive model for predicting lymph node metastasis in patients with ewing&#x0027;s sarcoma</article-title>. <source>Front Med (Lausanne)</source>. (<year>2022</year>) <volume>9</volume>:<fpage>832108</fpage>. <pub-id pub-id-type="doi">10.3389/fmed.2022.832108</pub-id><pub-id pub-id-type="pmid">35463005</pub-id></citation></ref>
<ref id="B29"><label>29.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Alkatout</surname><given-names>I</given-names></name><name><surname>Naumann</surname><given-names>CM</given-names></name><name><surname>Hedderich</surname><given-names>J</given-names></name><name><surname>Hegele</surname><given-names>A</given-names></name><name><surname>Bolenz</surname><given-names>C</given-names></name><name><surname>Junemann</surname><given-names>KP</given-names></name><etal/></person-group> <article-title>Squamous cell carcinoma of the penis: predicting nodal metastases by histologic grade, pattern of invasion and clinical examination</article-title>. <source>Urol Oncol</source>. (<year>2011</year>) <volume>29</volume>:<fpage>774</fpage>&#x2013;<lpage>81</lpage>. <pub-id pub-id-type="doi">10.1016/j.urolonc.2009.10.014</pub-id><pub-id pub-id-type="pmid">20060332</pub-id></citation></ref>
<ref id="B30"><label>30.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pettaway</surname><given-names>CA</given-names></name><name><surname>Pagliaro</surname><given-names>L</given-names></name><name><surname>Theodore</surname><given-names>C</given-names></name><name><surname>Haas</surname><given-names>G</given-names></name></person-group>. <article-title>Treatment of visceral, unresectable, or bulky/unresectable regional metastases of penile cancer</article-title>. <source>Urology</source>. (<year>2010</year>) <volume>76</volume>:<fpage>S58</fpage>&#x2013;<lpage>65</lpage>. <pub-id pub-id-type="doi">10.1016/j.urology.2010.03.082</pub-id><pub-id pub-id-type="pmid">20691886</pub-id></citation></ref>
<ref id="B31"><label>31.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lam</surname><given-names>W</given-names></name><name><surname>Alnajjar</surname><given-names>HM</given-names></name><name><surname>La-Touche</surname><given-names>S</given-names></name><name><surname>Perry</surname><given-names>M</given-names></name><name><surname>Sharma</surname><given-names>D</given-names></name><name><surname>Corbishley</surname><given-names>C</given-names></name><etal/></person-group> <article-title>Dynamic sentinel lymph node biopsy in patients with invasive squamous cell carcinoma of the penis: a prospective study of the long-term outcome of 500 inguinal basins assessed at a single institution</article-title>. <source>Eur Urol</source>. (<year>2013</year>) <volume>63</volume>:<fpage>657</fpage>&#x2013;<lpage>63</lpage>. <pub-id pub-id-type="doi">10.1016/j.eururo.2012.10.035</pub-id><pub-id pub-id-type="pmid">23153743</pub-id></citation></ref>
<ref id="B32"><label>32.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kroon</surname><given-names>BK</given-names></name><name><surname>Horenblas</surname><given-names>S</given-names></name><name><surname>Lont</surname><given-names>AP</given-names></name><name><surname>Tanis</surname><given-names>PJ</given-names></name><name><surname>Gallee</surname><given-names>MP</given-names></name><name><surname>Nieweg</surname><given-names>OE</given-names></name></person-group>. <article-title>Patients with penile carcinoma benefit from immediate resection of clinically occult lymph node metastases</article-title>. <source>J Urol</source>. (<year>2005</year>) <volume>173</volume>:<fpage>816</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1097/01.ju.0000154565.37397.4d</pub-id><pub-id pub-id-type="pmid">15711276</pub-id></citation></ref>
<ref id="B33"><label>33.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hamy</surname><given-names>AS</given-names></name><name><surname>Lam</surname><given-names>GT</given-names></name><name><surname>Laas</surname><given-names>E</given-names></name><name><surname>Darrigues</surname><given-names>L</given-names></name><name><surname>Balezeau</surname><given-names>T</given-names></name><name><surname>Guerin</surname><given-names>J</given-names></name><etal/></person-group> <article-title>Lymphovascular invasion after neoadjuvant chemotherapy is strongly associated with poor prognosis in breast carcinoma</article-title>. <source>Breast Cancer Res Treat</source>. (<year>2018</year>) <volume>169</volume>:<fpage>295</fpage>&#x2013;<lpage>304</lpage>. <pub-id pub-id-type="doi">10.1007/s10549-017-4610-0</pub-id><pub-id pub-id-type="pmid">29374852</pub-id></citation></ref>
<ref id="B34"><label>34.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>K</given-names></name><name><surname>Sun</surname><given-names>J</given-names></name><name><surname>Wei</surname><given-names>X</given-names></name><name><surname>Wu</surname><given-names>G</given-names></name><name><surname>Wang</surname><given-names>F</given-names></name><name><surname>Fan</surname><given-names>C</given-names></name><etal/></person-group> <article-title>Prognostic value of lymphovascular invasion in patients with squamous cell carcinoma of the penis following surgery</article-title>. <source>Bmc Cancer</source>. (<year>2019</year>) <volume>19</volume>:<fpage>476</fpage>. <pub-id pub-id-type="doi">10.1186/s12885-019-5714-1</pub-id><pub-id pub-id-type="pmid">31113402</pub-id></citation></ref></ref-list>
</back>
</article>