<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Oncol.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Oncology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Oncol.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2234-943X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fonc.2026.1762494</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Role of urinary leukocytes in the risk stratification of prostate cancer using nonlinear stacking learning strategy: a bi-cohort diagnostic study</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Xia</surname><given-names>Shou</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2020;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Ran</surname><given-names>Zhenchun</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3307855/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Cheng</surname><given-names>Mengzhe</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhu</surname><given-names>Hao</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Yang</surname><given-names>Chunguang</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/970002/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Wu</surname><given-names>Xinglong</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Xianning Polytechnic</institution>, <city>Xianning</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>School of Computer Science and Engineering, Hubei Key Laboratory of Intelligent Robot, Wuhan Institute of Technology</institution>, <city>Wuhan</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff3"><label>3</label><institution>Aerospace Nanhu Electronic Information Technology Co.</institution>, <city>Ltd.</city>, <state>Jingzhou</state>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff4"><label>4</label><institution>Department of Urology, Tongji Hospital, Tongji Medical College, Huazhong University of Science and Technology</institution>, <city>Wuhan</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff5"><label>5</label><institution>Xinjiang Key Laboratory of Artificial Intelligence Assisted Imaging Diagnosis</institution>, <city>Kashi</city>,&#xa0;<country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Xinglong Wu, <email xlink:href="mailto:xwu@wit.edu.cn">xwu@wit.edu.cn</email></corresp>
<fn fn-type="equal" id="fn003">
<label>&#x2020;</label>
<p>These authors have contributed equally to this work</p></fn>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-03-02">
<day>02</day>
<month>03</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>16</volume>
<elocation-id>1762494</elocation-id>
<history>
<date date-type="received">
<day>07</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>03</day>
<month>02</month>
<year>2026</year>
</date>
<date date-type="rev-recd">
<day>14</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Xia, Ran, Cheng, Zhu, Yang and Wu.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Xia, Ran, Cheng, Zhu, Yang and Wu</copyright-holder>
<license>
<ali:license_ref start_date="2026-03-02">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Objective</title>
<p>This study aimed to develop a non-linear stacking ensemble learning framework to evaluate the incremental diagnostic contribution of urinary leukocytes (UL) in prostate cancer (PCa) risk stratification, with a primary focus on predictive performance and clinical utility.</p>
</sec>
<sec>
<title>Methods</title>
<p>We retrospectively included 492 men with elevated PSA levels from Tongji Hospital (n = 415) and Xiangyang Central Hospital (n = 77). All patients underwent transrectal ultrasound-guided prostate biopsy and were classified into low-, intermediate-, and high-risk PCa according to the Gleason score. Clinical variables, including age, BMI, tPSA, f/tPSA, p2PSA, PHI, PHID, and PSAD, were collected and standardized. Feature selection was performed using least absolute shrinkage and selection operator (LASSO) regression combined with bootstrap-based stability analysis. Based on the selected features, we constructed a non-linear stacking ensemble comprising decision tree, logistic regression, support vector machine (SVM), k-nearest neighbors (KNN), and gradient boosting as base learners. Three-class risk stratification models were trained under two scenarios: with and without incorporation of UL. Model performance was evaluated using the area under the receiver operating characteristic curve (AUC), macro-F1 score, and the DeLong test. Calibration curves and decision curve analysis (DCA) were applied to quantify the incremental net clinical benefit associated with UL. Predefined subgroup analyses across PSA strata (&lt;10, 10&#x2013;20, &gt;20 ng/mL) were conducted to examine the context-dependent contribution of UL.</p>
</sec>
<sec>
<title>Results</title>
<p>In the baseline setting without UL, the non-linear stacking model achieved AUCs of 0.962 and 0.928 in the internal and external cohorts, respectively, indicating robust discriminative performance. After incorporating UL, several base learners&#x2014;particularly decision tree, KNN, and gradient boosting&#x2014;demonstrated center-specific AUC improvements ranging from 0.003 to 0.02 (p &lt; 0.05), accompanied by consistently increased net clinical benefit on DCA. Subgroup analyses showed that the incremental value of UL was most evident in patients with intermediate PSA levels (4&#x2013;10 ng/mL) and in those with clinical features suggestive of benign prostatic hyperplasia. <italic>Post hoc</italic> SHapley Additive exPlanations (SHAP) analyses performed on a representative base learner indicated that UL exerted a modest but directionally consistent influence on high-risk predictions, complementing established PSA-derived indices rather than acting as a dominant independent driver.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>Within a stacking ensemble&#x2013;based risk stratification framework primarily optimized for predictive performance, urinary leukocytes provide a clinically meaningful auxiliary signal that improves discrimination and net benefit in specific PSA-defined subgroups. These findings support the use of UL as a complementary inflammation-related marker in PCa risk assessment, while interpretability is best understood at the level of base learners and original clinical features rather than the full ensemble model.</p>
</sec>
</abstract>
<kwd-group>
<kwd>prostate cancer</kwd>
<kwd>prostate-specific antigen</kwd>
<kwd>risk stratification</kwd>
<kwd>stacking learning</kwd>
<kwd>urinary leukocytes</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This work was supported by the Hubei key R&amp;D project (2023DJC160), the Medical Artificial Intelligence Fund of Tongji Hospital (AI2024B05) and the Xinjiang Key Laboratory of Artificial Intelligence Assisted Imaging Diagnosis Fund (Grant No. XJRGZN2024008).</funding-statement>
</funding-group>
<counts>
<fig-count count="6"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="25"/>
<page-count count="13"/>
<word-count count="6705"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Genitourinary Oncology</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Prostate cancer (PCa) remains one of the most prevalent malignancies among men worldwide and continues to impose a substantial and enduring burden on public health systems (<xref ref-type="bibr" rid="B1">1</xref>). Accurate risk stratification constitutes a pivotal component of contemporary PCa management. Patients with indolent or low-risk disease may be safely managed with active surveillance to avoid overtreatment, whereas those with intermediate- or high-risk disease require timely definitive therapy to mitigate the risks of metastasis and disease-specific mortality. Current clinical guidelines commonly stratify patients into low-, intermediate-, and high-risk groups&#x2014;or more granular subcategories&#x2014;based on prostate-specific antigen (PSA) levels, Gleason score/ISUP grade, and clinical stage. Extensive evidence indicates that such multidimensional risk systems are strongly associated with tumor grade, therapeutic decision pathways, and long-term outcomes, helping reduce unnecessary biopsies and overtreatment while maintaining the detection rate of clinically significant disease (<xref ref-type="bibr" rid="B2">2</xref>&#x2013;<xref ref-type="bibr" rid="B4">4</xref>). In contemporary clinical practice, prostate cancer risk stratification integrates histopathological and imaging-based assessments. The Gleason score, obtained from prostate biopsy, defines tumor aggressiveness and definitive risk categories, whereas PI-RADS provides an MRI-based estimate of lesion suspicion prior to biopsy and guides biopsy indication and targeting.</p>
<p>Despite their clinical utility, conventional risk stratification models face two persistent challenges in real-world settings. First, PSA and its derivative indices lack sufficient specificity; elevations may arise from benign prostatic hyperplasia (BPH), prostatitis, or subclinical inflammation. Second, many existing stratification approaches rely on linear or near-linear assumptions, limiting their ability to capture the nonlinear and interactive relationships among heterogeneous clinical variables, thereby constraining the accuracy of personalized decision-making.</p>
<p>Among various liquid biomarkers, urine has clear advantages&#x2014;noninvasiveness, ease of repeated collection, and anatomical proximity to the prostate. Urine-based assays such as PCA3,TMPRSS2:ERG, and ExoDx Prostate have been successfully developed, building on foundational work by Fujita et&#xa0;al. (<xref ref-type="bibr" rid="B5">5</xref>). In contrast, routine urinalysis parameters&#x2014;particularly urinary leukocytes (UL)&#x2014;have long been overlooked in PCa risk stratification. UL are typically interpreted as markers of urinary tract infection or sterile inflammation (<xref ref-type="bibr" rid="B4">4</xref>). Elevated UL may influence PSA interpretation and prostate volume assessments; however, prior studies have largely regarded UL as a confounder rather than a potentially informative feature (<xref ref-type="bibr" rid="B6">6</xref>). While some evidence suggests an association between sterile pyuria and aberrant PSA elevation (<xref ref-type="bibr" rid="B5">5</xref>), its relationship with biopsy positivity has been inconsistent, implying that inflammatory processes may introduce systematic bias into PSA-based diagnostic reasoning (<xref ref-type="bibr" rid="B7">7</xref>). Within the context of precision medicine, a natural yet unresolved question emerges: if UL are no longer treated as noise but are integrated alongside PSA-derived markers within data-driven models, can they contribute incremental information to enhance PCa risk stratification?</p>
<p>With the rapid adoption of machine learning and deep learning in urologic oncology, numerous models&#x2014;including random forests, support vector machines, gradient boosting machines, neural networks, and radiomics-based classifiers&#x2014;have been proposed for early PCa detection and risk prediction (<xref ref-type="bibr" rid="B8">8</xref>). Many demonstrate superior discriminative performance compared with traditional regression models, and decision curve analyses often show improved net clinical benefit (<xref ref-type="bibr" rid="B2">2</xref>). However, the vast majority of existing studies focus on &#x201c;canonical&#x201d; predictors such as PSA, PHI, PHID, PSAD, and MRI-derived features; routine urinalysis markers have been sparsely explored. To date, no study has explicitly incorporated urinary leukocytes into a multiclass PCa risk stratification model or rigorously assessed their incremental diagnostic value using nonlinear ensemble learning frameworks in multi-center cohorts (<xref ref-type="bibr" rid="B9">9</xref>).</p>
<p>To fill this methodological and clinical gap, we proposed a nonlinear ensemble learning strategy incorporating urinary leukocytes as a candidate predictive feature for three-class PCa risk stratification (<xref ref-type="bibr" rid="B10">10</xref>). Leveraging real-world data from 492 patients across Tongji Hospital and Xiangyang Central Hospital, we applied LASSO with bootstrap stability selection to identify robust predictors and subsequently constructed a nonlinear stacking framework integrating gradient boosting machines, support vector machines, logistic regression, and k-nearest neighbors. Two parallel models&#x2014;without UL and with UL&#x2014;were developed. Using micro-ROC AUC, macro-F1, calibration curves, DeLong tests, and decision curve analysis, we quantified the incremental value of UL and assessed its consistency across PSA subgroups. In addition, SHAP-based model interpretability was employed to characterize nonlinear interactions between UL and key markers such as PSAD and PHI, and to delineate patient-level decision contributions (<xref ref-type="bibr" rid="B11">11</xref>).</p>
<p>This study features several methodological and clinical innovations: (i) to our knowledge, it is the first multicenter analysis to systematically evaluate the additive diagnostic value of routine urinalysis indicators&#x2014;specifically urinary leukocytes&#x2014;in three-class PCa risk stratification; (ii) the nonlinear ensemble learning and multi-metric decision analytic framework better approximates real-world decision boundaries than traditional linear models; and (iii) the interpretability analyses provide mechanistic insights into whether UL should be retained as a cost-effective and clinically meaningful feature within PCa risk models. Collectively, this work offers data-driven evidence to support whether and how UL may be judiciously integrated into contemporary PCa risk assessment workflows.</p>
</sec>
<sec id="s2">
<label>2</label>
<title>Participants and methods</title>
<p>This retrospective study was approved by the Ethics Committee of Tongji Hospital, Tongji Medical College, Huazhong University of Science and Technology (approval No. TJ-IRB202303129), with a waiver of written informed consent. All data were de-identified prior to analysis and used exclusively for research purposes.</p>
<sec id="s2_1">
<label>2.1</label>
<title>Participants</title>
<sec id="s2_1_1">
<label>2.1.1</label>
<title>Patient sources and eligibility criteria</title>
<p>A total of 492 patients were included in this study, comprising 415 cases from Tongji Hospital and 77 cases from Xiangyang Central Hospital. The internal cohort consisted of 415 men with elevated PSA levels who presented to Tongji Hospital between December 2022 and March 2024. The external cohort included men with elevated PSA levels who presented to Xiangyang Central Hospital between April and May 2024. Clinical information and histopathological findings were collected for all participants. Inclusion criteria were as follows: (1) availability of accurate clinical information sufficient for calculating PSA-derived parameters; (2) prostate MRI performed prior to biopsy; (3) MRI quality adequate for Prostate Imaging&#x2013;Reporting and Data System (PI-RADS) scoring. Exclusion criteria were: missing key clinical variables (e.g. PSA level, pathological Gleason score) that could not be retrieved from the medical records, and absence of urinary leukocyte measurements.</p>
</sec>
<sec id="s2_1_2">
<label>2.1.2</label>
<title>Risk stratification</title>
<p>Pathological Gleason score was used to define three risk categories (<xref ref-type="bibr" rid="B12">12</xref>), which served as the three-class labels (low/intermediate/high) for the machine learning models: low-risk, Gleason score &#x2264; 6; intermediate-risk, Gleason score = 7; and high-risk, Gleason score &#x2265; 8.</p>
<p>Training and validation cohorts: Data from Tongji Hospital were used for model development and internal validation. To preserve the overall distribution and the proportion of risk categories, the Tongji cohort was randomly split into a training set and an internal test set at a 7:3 ratio using stratified sampling. Data from Xiangyang Central Hospital were not used for feature selection or model training and were reserved as an independent external validation cohort to assess model generalizability and stability.</p>
</sec>
<sec id="s2_1_3">
<label>2.1.3</label>
<title>Urinary leukocytes assessment</title>
<p>Urinary leukocytes were obtained from routine pre-biopsy urinalysis performed on fresh midstream urine samples as part of standard clinical work-up. Urinalysis was conducted using automated urine analyzers routinely deployed in each participating center, following manufacturers&#x2019; standard operating procedures.</p>
<p>In the present study, UL was treated as a binary variable and defined as positive when leukocyte esterase was reported as &#x2265; trace/&#x201d;+&#x201d; on dipstick urinalysis, and negative otherwise. This threshold corresponds to standard clinical reporting practice and reflects the presence of urinary inflammatory activity rather than a quantitative leukocyte burden.</p>
<p>We did not explore alternative UL cut-offs in the primary analysis, as semi-quantitative dipstick grading (negative, trace, +, ++, +++) is not fully standardized across analyzers and centers. Instead, UL was intentionally modeled as a coarse binary indicator to ensure robustness and clinical generalizability across institutions.</p>
</sec>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Clinical characteristics</title>
<p>The clinical and pathological characteristics of patients in the training, internal test and external validation cohorts are summarized in <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Clinical and pathological characteristics of patients in the retrospective training and test cohorts.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Characteristics</th>
<th valign="middle" align="left">Retrospective training and test sets</th>
<th valign="middle" align="left">Retrospective training and test sets</th>
<th valign="middle" align="left">P-Values</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">number of patients</td>
<td valign="middle" align="left">415</td>
<td valign="middle" align="left">77</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">AGE(years)</td>
<td valign="middle" align="left">66.00 (60.00&#x2013;72.00)</td>
<td valign="middle" align="left">68.00 (61.00&#x2013;72.00)</td>
<td valign="middle" align="left">0.2282</td>
</tr>
<tr>
<td valign="middle" align="left">BMI(kg/m&#xb2;)</td>
<td valign="middle" align="left">23.66 (21.95&#x2013;25.63)</td>
<td valign="middle" align="left">23.70 (21.80&#x2013;25.80)</td>
<td valign="middle" align="left">0.9703</td>
</tr>
<tr>
<td valign="middle" align="left">tPSA(ng/ml) (ng/ml)</td>
<td valign="middle" align="left">9.37 (6.35&#x2013;14.67)</td>
<td valign="middle" align="left">10.28 (6.42&#x2013;15.63)</td>
<td valign="middle" align="left">0.7372</td>
</tr>
<tr>
<td valign="middle" align="left">fPSA(ng/ml)</td>
<td valign="middle" align="left">1.48 (0.98&#x2013;2.25)</td>
<td valign="middle" align="left">1.19 (0.85&#x2013;1.77)</td>
<td valign="middle" align="left">0.0215*</td>
</tr>
<tr>
<td valign="middle" align="left">fPSA/tPSA(ng/ml)</td>
<td valign="middle" align="left">15.75 (10.89&#x2013;22.23)</td>
<td valign="middle" align="left">12.61 (9.10&#x2013;17.05)</td>
<td valign="middle" align="left">&lt;0.001*</td>
</tr>
<tr>
<td valign="middle" align="left">p2PSA(ng/ml)</td>
<td valign="middle" align="left">19.81 (12.82&#x2013;31.77)</td>
<td valign="middle" align="left">18.24 (12.23&#x2013;33.28)</td>
<td valign="middle" align="left">0.8772</td>
</tr>
<tr>
<td valign="middle" align="left">PHI</td>
<td valign="middle" align="left">41.70 (28.00&#x2013;65.45)</td>
<td valign="middle" align="left">49.60 (30.10&#x2013;81.10)</td>
<td valign="middle" align="left">0.0562</td>
</tr>
<tr>
<td valign="middle" align="left">PSAD(ng)</td>
<td valign="middle" align="left">0.20 (0.12&#x2013;0.36)</td>
<td valign="middle" align="left">0.19 (0.13&#x2013;0.40)</td>
<td valign="middle" align="left">0.9708</td>
</tr>
<tr>
<td valign="middle" align="left">PHID</td>
<td valign="middle" align="left">0.86 (0.47&#x2013;1.93)</td>
<td valign="middle" align="left">0.92 (0.52&#x2013;2.47)</td>
<td valign="middle" align="left">0.2677</td>
</tr>
<tr>
<td valign="middle" align="left">Neutrophils(10<sup>^9</sup>/L)</td>
<td valign="middle" align="left">3.41 (2.70&#x2013;4.22)</td>
<td valign="middle" align="left">3.90 (3.18&#x2013;5.32)</td>
<td valign="middle" align="left">0.0013*</td>
</tr>
<tr>
<td valign="middle" align="left">Lymphocytes(10<sup>^9</sup>/L)</td>
<td valign="middle" align="left">1.61 (1.29&#x2013;1.92)</td>
<td valign="middle" align="left">1.48 (1.08&#x2013;1.81)</td>
<td valign="middle" align="left">0.0549</td>
</tr>
<tr>
<td valign="middle" align="left">NLR(10<sup>^9</sup>/L)</td>
<td valign="middle" align="left">2.17 (1.68&#x2013;2.91)</td>
<td valign="middle" align="left">2.87 (1.76&#x2013;4.07)</td>
<td valign="middle" align="left">&lt;0.001*</td>
</tr>
<tr>
<td valign="middle" align="left">Volume(mL)</td>
<td valign="middle" align="left">46.44 (30.51&#x2013;66.04)</td>
<td valign="middle" align="left">44.60 (31.20&#x2013;72.20)</td>
<td valign="middle" align="left">0.8645</td>
</tr>
<tr>
<th valign="middle" align="left">Gleason Score, n (%)</th>
<th valign="middle" align="left"/>
<th valign="middle" align="left"/>
<th valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;Benign</td>
<td valign="middle" align="left">270 (65.1%)</td>
<td valign="middle" align="left">47 (61.0%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;Intermediate</td>
<td valign="middle" align="left">105 (25.3%)</td>
<td valign="middle" align="left">20 (26.0%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;High</td>
<td valign="middle" align="left">40 (9.6%)</td>
<td valign="middle" align="left">10 (13.0%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">Smoking history, n (%)</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">0.1546</td>
</tr>
<tr>
<td valign="middle" align="left">0</td>
<td valign="middle" align="left">302 (72.8%)</td>
<td valign="middle" align="left">62 (80.5%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">1</td>
<td valign="middle" align="left">113 (27.2%)</td>
<td valign="middle" align="left">15 (19.5%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">urinary leukocytes, n (%)</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">0.0612</td>
</tr>
<tr>
<td valign="middle" align="left">0</td>
<td valign="middle" align="left">299 (72.6%)</td>
<td valign="middle" align="left">65 (84.4%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">1</td>
<td valign="middle" align="left">113 (27.4%)</td>
<td valign="middle" align="left">12 (15.6%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">PIRADS, n (%)</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">0.7457</td>
</tr>
<tr>
<td valign="middle" align="left">1</td>
<td valign="middle" align="left">8 (1.9%)</td>
<td valign="middle" align="left">0 (0.0%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">2</td>
<td valign="middle" align="left">86 (20.7%)</td>
<td valign="middle" align="left">14 (18.2%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">3</td>
<td valign="middle" align="left">157 (37.8%)</td>
<td valign="middle" align="left">30 (39.0%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">4</td>
<td valign="middle" align="left">83 (20.0%)</td>
<td valign="middle" align="left">16 (20.8%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">5</td>
<td valign="middle" align="left">81 (19.5%)</td>
<td valign="middle" align="left">17 (22.1%)</td>
<td valign="middle" align="left"/>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>*indicates a statistically significant difference.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Study pipeline</title>
<sec id="s2_3_1">
<label>2.3.1</label>
<title>Overall workflow and modeling framework</title>
<p>The overall study workflow and modeling pipeline are schematically illustrated in <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Flowchart of data screening and cohort allocation. <bold>(a)</bold> Internal dataset; <bold>(b)</bold> External validation dataset.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1762494-g001.tif">
<alt-text content-type="machine-generated">Flowchart with two panels showing patient selection for prostate cancer model development and validation. Panel a: Out of 443 patients at Tongji Hospital, 415 included after exclusions; Gleason scores distributed as less than 7 in 270 patients, equal to 7 in 105 patients, and greater than 7 in 40 patients. Panel b: Out of 108 patients at Xiangyang Central Hospital, 77 included after exclusions; Gleason scores less than 7 in 47 patients, equal to 7 in 20 patients, and greater than 7 in 10 patients.</alt-text>
</graphic></fig>
</sec>
<sec id="s2_3_2">
<label>2.3.2</label>
<title>Feature engineering and variable selection</title>
<p>To fully capture potential nonlinear relationships between prostate-related indices and tumor risk, while controlling the risk of overfitting in a high-dimensional feature space, we performed systematic feature engineering and regularized variable selection prior to model development.</p>
<p>Based on prior literature and clinical expertise, we first identified a predefined set of baseline clinical and biochemical variables, including age, body mass index (BMI), total PSA (tPSA), free-to-total PSA ratio (f/tPSA), p2PSA, Prostate Health Index (PHI), PHI density (PHID), PSA density (PSAD), PI-RADS score, prostate volume, and Lymphocytes cell counts. PHI and p2PSA have been shown in multicenter cohorts and systematic reviews to significantly improve discrimination of clinically significant PCa beyond conventional tPSA, with superior AUC and decision-curve performance compared with PSA-only models (<xref ref-type="bibr" rid="B13">13</xref>). PSAD and PHID have been repeatedly validated as important parameters for identifying high-risk lesions and reducing unnecessary biopsies, whereas PI-RADS v2/v2.1 has become a standardized tool for mpMRI-based assessment of suspicious lesions and their correspondence with Gleason grading (<xref ref-type="bibr" rid="B14">14</xref>). Collectively, these data support using the above variables as the core feature set for model construction and extension in the present study.</p>
<p>Given that these indices typically exhibit skewed distributions, threshold effects and saturation effects, we predefined, using only the internal training set, a library of statistically plausible nonlinear&#xa0;transformations for each candidate variable (<xref ref-type="bibr" rid="B15">15</xref>). These&#xa0;transformations included, but were not limited to, logarithm&#xa0;(log), square root (sqrt), reciprocal, square, hyperbolic tangent&#xa0;(tanh), sigmoid, tangent (tan), and simple sinusoidal transformations (sin/cos). Importantly, these transformations were not intended to represent explicit physiological mechanisms for each variable; rather, they serve as generic nonlinear basis functions that allow the models to capture complex, potentially non-monotonic relationships in a data-driven manner. All transformations were specified <italic>a priori</italic>, and the same rules were applied uniformly across variables to generate an expanded feature set, thereby constructing a rich yet interpretable candidate feature space rather than performing outcome-driven, <italic>post hoc</italic> feature engineering (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2a</bold></xref>).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Nonlinear feature selection using multiclass LASSO. <bold>(a)</bold> coefficient paths of candidate nonlinear features as a function of &#x3bb; (= 1/C). As &#x3bb; increases, model sparsity increases and weak predictors are progressively eliminated. <bold>(b)</bold> 5-fold cross-validated multiclass log-loss as a function of &#x3bb;. The dashed line indicates the selected &#x3bb;, which lies within the near-optimal performance region while yielding a sparse feature set comprising 17 stable predictors.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1762494-g002.tif">
<alt-text content-type="machine-generated">Two-panel data visualization comparing regularization effects in model coefficients and cross-validated log-loss. Panel a, a line plot titled &#x201c;Coefficient Paths,&#x201d; shows mean absolute coefficient values for different features as functions of lambda (inverse C), with numerous colored lines labeled in the legend. Panel b, a line plot &#x201c;CV log-loss vs lambda,&#x201d; depicts cross-validated log-loss on the y-axis for increasing lambda, showing a U-shaped pattern with error bars, indicating minimum loss around lambda equals ten. Both panels use logarithmic x-axes and include a vertical dashed line at lambda equals ten.</alt-text>
</graphic></fig>
<p>After nonlinear expansion, we applied L1-regularized multinomial logistic regression (least absolute shrinkage and selection operator, LASSO) for feature selection (<xref ref-type="bibr" rid="B16">16</xref>). By introducing an L1 penalty term into the loss function, LASSO shrinks coefficients of non-informative or highly redundant features exactly to zero, thus achieving parameter estimation and dimensionality reduction within a single framework. This approach is particularly suited to medical datasets in which the number of features approaches or exceeds the sample size (<xref ref-type="bibr" rid="B17">17</xref>). The regularization parameter &#x3bb; was chosen on the internal training set via K-fold cross-validation, with the average multinomial log-loss used as the optimization criterion. As illustrated in <xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2b</bold></xref>, the cross-validated log-loss reached its minimum at an optimal &#x3bb; (dashed vertical line), reflecting the best trade-off between predictive accuracy and model sparsity. This data-driven selection ensured that only the most informative nonlinear features were retained while reducing the risk of overfitting.</p>
<p>To assess the stability of variable selection, we employed a resampling strategy (bootstrap or repeated cross-validation) within the training set, refitting the LASSO model in each resampled dataset (<xref ref-type="bibr" rid="B18">18</xref>) and recording the selection frequency of every candidate feature. Only features that were consistently selected in the majority of resampling iterations were retained as the final modeling feature set. These features were then used to train the subsequent nonlinear machine learning models (gradient boosting,&#xa0;support vector machine, logistic regression, k-nearest neighbors, etc.) under two scenarios: without UL and with UL. This pipeline ensured reproducible and interpretable feature engineering while minimizing the influence of stochastic noise on model construction.</p>
</sec>
<sec id="s2_3_3">
<label>2.3.3</label>
<title>Ensemble learning strategy</title>
<p>We first trained and evaluated more than ten commonly used machine learning algorithms on the training cohort using 5-fold cross-validation, including logistic regression (Logistic Regression), support vector machine (SVM), k-nearest neighbors (kNN), decision tree (Decision Tree), random forest (Random Forest, RF), gradient boosting decision tree (Gradient Boosting), extreme gradient boosting (XGBoost), Light Gradient Boosting Machine (LightGBM), na&#xef;ve Bayes (Naive Bayes) and multilayer perceptron (MLP). Hyperparameters for each model were tuned by grid search, an exhaustive procedure that iterates over all predefined combinations within a hyperparameter grid, trains and evaluates each configuration, and selects the one achieving the best cross-validated performance on the validation folds (<xref ref-type="bibr" rid="B19">19</xref>).</p>
<p>We then designed an ensemble learning strategy tailored for PCa risk stratification and multi-class classification. The five best-performing base learners were selected according to their cross-validated performance. For these five models, hyperparameters were further optimized using grid search combined with 5-fold cross-validation, and the models were trained and fine-tuned on the retrospective cohorts, yielding a set of high-performing and mutually complementary base classifiers that underpin the subsequent ensemble schemes. Two ensemble approaches were constructed and compared: voting and stacking (<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B21">21</xref>). In the voting ensemble, we implemented an equal-weight soft-voting scheme, in which the class probabilities output by the five probability-calibrated base models were averaged without weighting to obtain the final prediction (<xref ref-type="bibr" rid="B22">22</xref>). In the stacking ensemble, we adopted a two-layer architecture. The first layer consisted of the same five base models; using 5-fold cross-validation on the training set, we obtained out-of-fold class probability predictions for each model, and concatenated these multi-class probability vectors to form a new set of meta-features. The second layer employed L2-regularized logistic regression as the meta-learner (<xref ref-type="bibr" rid="B23">23</xref>), which learns an optimal linear combination of the base-model outputs without information leakage. This design allows automatic estimation of the contribution (weights) of each base learner and aims to further improve overall predictive performance. All ensembles were constructed and evaluated under two scenarios&#x2014;without UL and with UL&#x2014;to quantify the incremental value of urinary leukocytes for PCa risk stratification.</p>
</sec>
<sec id="s2_3_4">
<label>2.3.4</label>
<title>Statistical analysis</title>
<p>Continuous variables (<xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>) are summarized as median and interquartile range (IQR) and were compared between groups using the Mann&#x2013;Whitney U test. Categorical variables are presented as counts and percentages and were compared using the &#x3c7;&#xb2; test. All statistical tests were two-sided, and a P value &lt; 0.05 was considered statistically significant.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Performance of multiple models on the internal test set and external validation cohort.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Dataset</th>
<th valign="middle" align="left">Model</th>
<th valign="middle" align="left">AUC (95%CI)</th>
<th valign="middle" align="left">Accuracy</th>
<th valign="middle" align="left">MacroF1</th>
<th valign="middle" align="left">MacroPPV</th>
<th valign="middle" align="left">MacroNPV</th>
<th valign="middle" align="left">Pos2_ Sensitivity</th>
<th valign="middle" align="left">Pos2_ Specificity</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="7" align="left"><bold><italic>Internal</italic></bold></td>
<td valign="middle" align="left">Decision<break/>Tree</td>
<td valign="middle" align="left">0.927 (0.898-0.954)</td>
<td valign="middle" align="left">0.81</td>
<td valign="middle" align="left">0.60</td>
<td valign="middle" align="left">0.83</td>
<td valign="middle" align="left">0.90</td>
<td valign="middle" align="left">0.13</td>
<td valign="middle" align="left">1</td>
</tr>
<tr>
<td valign="middle" align="left">Gradient<break/>Boosting</td>
<td valign="middle" align="left">0.947 (0.912-0.976)</td>
<td valign="middle" align="left">0.84</td>
<td valign="middle" align="left"><bold>0.70</bold></td>
<td valign="middle" align="left">0.74</td>
<td valign="middle" align="left">0.93</td>
<td valign="middle" align="left">0.38</td>
<td valign="middle" align="left">0.97</td>
</tr>
<tr>
<td valign="middle" align="left">KNN</td>
<td valign="middle" align="left">0.936 (0.903-0.968)</td>
<td valign="middle" align="left">0.83</td>
<td valign="middle" align="left">0.69</td>
<td valign="middle" align="left">0.74</td>
<td valign="middle" align="left">0.92</td>
<td valign="middle" align="left">0.38</td>
<td valign="middle" align="left">0.97</td>
</tr>
<tr>
<td valign="middle" align="left">Logistic<break/>Regression</td>
<td valign="middle" align="left">0.952 (0.934-0.970)</td>
<td valign="middle" align="left">0.81</td>
<td valign="middle" align="left">0.66</td>
<td valign="middle" align="left">0.75</td>
<td valign="middle" align="left">0.93</td>
<td valign="middle" align="left">0.38</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">SVM</td>
<td valign="middle" align="left">0.949 (0.920-0.972)</td>
<td valign="middle" align="left">0.81</td>
<td valign="middle" align="left">0.67</td>
<td valign="middle" align="left">0.71</td>
<td valign="middle" align="left">0.92</td>
<td valign="middle" align="left"><bold>0.88</bold></td>
<td valign="middle" align="left">0.88</td>
</tr>
<tr>
<td valign="middle" align="left">Stacking</td>
<td valign="middle" align="left"><bold>0.962 (0.936-0.983)</bold></td>
<td valign="middle" align="left"><bold>0.86</bold></td>
<td valign="middle" align="left">0.69</td>
<td valign="middle" align="left"><bold>0.87</bold></td>
<td valign="middle" align="left"><bold>0.94</bold></td>
<td valign="middle" align="left">0.25</td>
<td valign="middle" align="left"><bold>1</bold></td>
</tr>
<tr>
<td valign="middle" align="left">Voting</td>
<td valign="middle" align="left">0.956 (0.930-0.978)</td>
<td valign="middle" align="left">0.84</td>
<td valign="middle" align="left">0.67</td>
<td valign="middle" align="left">0.86</td>
<td valign="middle" align="left"><bold>0.94</bold></td>
<td valign="middle" align="left">0.25</td>
<td valign="middle" align="left"><bold>1</bold></td>
</tr>
<tr>
<td valign="middle" rowspan="7" align="left"><bold><italic>External</italic></bold></td>
<td valign="middle" align="left">Decision<break/>Tree</td>
<td valign="middle" align="left">0.925 (0.897-0.951)</td>
<td valign="middle" align="left">0.77</td>
<td valign="middle" align="left">0.61</td>
<td valign="middle" align="left">0.80</td>
<td valign="middle" align="left">0.88</td>
<td valign="middle" align="left">0.20</td>
<td valign="middle" align="left"><bold>1</bold></td>
</tr>
<tr>
<td valign="middle" align="left">Gradient<break/>Boosting</td>
<td valign="middle" align="left">0.920 (0.878-0.953)</td>
<td valign="middle" align="left">0.75</td>
<td valign="middle" align="left">0.64</td>
<td valign="middle" align="left">0.70</td>
<td valign="middle" align="left">0.88</td>
<td valign="middle" align="left">0.50</td>
<td valign="middle" align="left">0.97</td>
</tr>
<tr>
<td valign="middle" align="left">KNN</td>
<td valign="middle" align="left">0.884 (0.839-0.923)</td>
<td valign="middle" align="left">0.70</td>
<td valign="middle" align="left">0.55</td>
<td valign="middle" align="left">0.59</td>
<td valign="middle" align="left">0.84</td>
<td valign="middle" align="left">0.30</td>
<td valign="middle" align="left">0.96</td>
</tr>
<tr>
<td valign="middle" align="left">Logistic<break/>Regression</td>
<td valign="middle" align="left">0.913 (0.880-0.944)</td>
<td valign="middle" align="left"><bold>0.78</bold></td>
<td valign="middle" align="left"><bold>0.67</bold></td>
<td valign="middle" align="left">0.73</td>
<td valign="middle" align="left"><bold>0.92</bold></td>
<td valign="middle" align="left">0.60</td>
<td valign="middle" align="left">0.97</td>
</tr>
<tr>
<td valign="middle" align="left">SVM</td>
<td valign="middle" align="left">0.921 (0.882-0.956)</td>
<td valign="middle" align="left">0.75</td>
<td valign="middle" align="left"><bold>0.67</bold></td>
<td valign="middle" align="left">0.66</td>
<td valign="middle" align="left">0.87</td>
<td valign="middle" align="left"><bold>0.80</bold></td>
<td valign="middle" align="left">0.87</td>
</tr>
<tr>
<td valign="middle" align="left">Stacking</td>
<td valign="middle" align="left"><bold>0.928 (0.897-0.954)</bold></td>
<td valign="middle" align="left">0.73</td>
<td valign="middle" align="left">0.52</td>
<td valign="middle" align="left">0.54</td>
<td valign="middle" align="left">0.87</td>
<td valign="middle" align="left">0.10</td>
<td valign="middle" align="left">0.96</td>
</tr>
<tr>
<td valign="middle" align="left">Voting</td>
<td valign="middle" align="left">0.927 (0.895-0.955)</td>
<td valign="middle" align="left">0.75</td>
<td valign="middle" align="left">0.58</td>
<td valign="middle" align="left">0.68</td>
<td valign="middle" align="left">0.89</td>
<td valign="middle" align="left">0.20</td>
<td valign="middle" align="left">0.99</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>(Pos2_* denotes performance metrics calculated with class 2 as the positive class; in this study, class 2 corresponds to the high-risk group. Bold values indicate the best-performing model for each metric within the corresponding dataset).</p></fn>
</table-wrap-foot>
</table-wrap>
<p>All statistical analyses and model development were performed in Python 3.11.11. Classical statistical tests and P value calculations were conducted using the SciPy library (two-sided tests with a significance level &#x3b1; = 0.05). Machine learning models were implemented with scikit-learn for model orchestration and pre-processing. For tree-based models, XGBoost (version 3.0.1) and LightGBM (version 4.6.0) were integrated through their respective scikit-learn compatible APIs. Specifically, XGBoost was used via the XGBClassifier from the xgboost library, and LightGBM was used via the LGBMClassifier from the lightgbm library. Other models, including RandomForest, DecisionTree, LogisticRegression, SVM, and KNN, were directly implemented using scikit-learn. Model interpretability analyses were carried out using the shap library (SHapley Additive exPlanations). Figures and graphical summaries were generated using matplotlib and seaborn. To enhance reproducibility, random seeds were fixed across all training and evaluation procedures.</p>
<p>Model performance was quantified using several metrics, including the area under the receiver operating characteristic curve (AUC), sensitivity, specificity and macro-averaged F1 score (macro-F1) (<xref ref-type="bibr" rid="B24">24</xref>). Sensitivity measures the ability of the model to correctly identify positive cases, whereas specificity measures its ability to correctly identify negative cases. The F1 score, defined as the harmonic mean of precision and recall, provides a composite measure that jointly accounts for false positives and false negatives&#xa0;and is particularly suitable for imbalanced multi-class classification (<xref ref-type="bibr" rid="B25">25</xref>).</p>
</sec>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Overall performance evaluation</title>
<p>Among all candidate algorithms, the five best-performing base learners were gradient boosting, support vector machine (SVM), logistic regression, k-nearest neighbors (KNN) and decision tree. <xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref> depicts the micro-averaged ROC curves of these models, and the corresponding quantitative results are summarized in <xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>. At the single-model level, all classifiers already achieved high discriminative performance, with AUCs ranging from 0.927 to 0.952; logistic regression yielded the highest AUC of 0.952 (95% CI, 0.934&#x2013;0.970). On top of this strong baseline, the ensemble strategies further improved overall performance: the stacking ensemble achieved an AUC of 0.962 (95% CI, 0.936&#x2013;0.983), and the voting ensemble achieved an AUC of 0.956 (95% CI, 0.930&#x2013;0.978), both outperforming any individual base learner. Stacking also showed slightly higher accuracy (0.86 vs. 0.84) and macro-averaged F1 score (0.69 vs. 0.67) compared with voting. Macro-averaged PPV (0.86&#x2013;0.87) and macro-averaged NPV (both 0.94), together with specificities approaching 1.000, indicated good negative-class recognition and overall stability for both ensembles. When high-risk PCa (Pos2) was treated as the positive class, SVM as a single model achieved the highest sensitivity (0.88), whereas the stacking and voting ensembles exhibited lower sensitivity for Pos2 (0.25 at the default decision threshold), reflecting a more conservative decision profile that prioritizes reduction of false positives.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Micro-averaged ROC curves of multiple models in the internal test set and external validation cohort.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1762494-g003.tif">
<alt-text content-type="machine-generated">Side-by-side ROC curve charts compare the performance of multiple classifiers on internal data (left panel) and external data (right panel), using dashed lines for models without UL and solid lines for models with UL. Each chart includes an inset zoomed on low false positive rates. Legends detail classifier types, AUC values, and confidence intervals. Both charts use true positive rate versus false positive rate axes.</alt-text>
</graphic></fig>
<p>External validation in the independent cohort showed that all models maintained good discrimination, with AUCs ranging from 0.884 to 0.928. The stacking and voting ensembles again performed slightly better than most single models, with AUCs of 0.928 (95% CI, 0.897&#x2013;0.954) and 0.927 (95% CI, 0.895&#x2013;0.955), respectively, compared with, for example, decision tree (AUC = 0.925), logistic regression (AUC = 0.913) and SVM (AUC = 0.921). In the external cohort, voting showed a modest advantage in terms of overall accuracy (0.75) and specificity (0.99), whereas stacking provided a more balanced trade-off between sensitivity and specificity, and between PPV and NPV, across clinically relevant decision thresholds (<xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>; <xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref>).</p>
<p>Taken together, the ensemble learning strategies enhanced the overall discriminative ability and robustness of PCa risk stratification beyond what was achievable with individual models alone. Among them, stacking appears more suitable when the primary objective is to maximize predictive performance and net clinical benefit, whereas voting&#x2014;characterized by a simpler structure and consistently high specificity and NPV&#x2014;offers an attractive and operationally straightforward option for clinical implementation.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Diagnostic value of UL for PCa risk stratification</title>
<p>To systematically quantify the incremental diagnostic value conferred by UL, we evaluated both calibration and clinical decision-analytic performance before and after incorporating UL into the models. Calibration was assessed using the multiclass Brier score and stratified calibration plots to examine the agreement between predicted probabilities and observed risks, and to compare the extent of calibration improvement after adding UL. Clinical utility was evaluated using decision curve analysis (DCA), which estimates the net benefit across a range of threshold probabilities (PT). We further computed &#x394;NB and &#x394;TP/&#x394;FP per 100 patients to visually illustrate the impact of UL on key clinical decisions (e.g., whether to perform biopsy or escalate management).</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Clinical applicability of UL for PCa risk stratification</title>
<p>As shown in <xref ref-type="fig" rid="f4"><bold>Figures&#xa0;4a&#x2013;f</bold></xref>, incorporation of UL led to a consistent improvement in calibration performance in both the internal and external cohorts. In the internal dataset, the multiclass Brier score decreased after adding UL (e.g. from 0.216 to 0.210 for stacking, from 0.257 to 0.247 for voting, and from 0.256 to 0.242 for gradient boosting), indicating better agreement between predicted probabilities and observed risks. Stratified calibration curves further demonstrated that the with UL models (solid lines) were generally closer to the 45&#xb0; identity line than their without UL counterparts (dashed lines), suggesting a reduction in over- or underestimation, particularly in the high-risk probability range.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Discrimination, calibration, and clinical utility of models with and without urinary leukocytes (UL). <bold>(a, b)</bold> Calibration curves for the internal cohort <bold>(a)</bold> and external cohort <bold>(b)</bold>. Solid lines indicate models with UL; dashed lines indicate models without UL. <bold>(c, d)</bold> Differences in net benefit (&#x394;NB) between models with and without UL in the internal <bold>(c)</bold> and external <bold>(d)</bold> cohorts. <bold>(e, f)</bold> Decision curve analysis showing net benefit across a range of threshold probabilities for models with and without UL.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1762494-g004.tif">
<alt-text content-type="machine-generated">Six-panel figure showing various calibration, net benefit, and decision curve analyses comparing machine learning models with and without uncertainty layers (UL) on internal and external data. Panel a and b display line calibration curves (internal and external) for multiple algorithms, with solid lines for with UL and dashed for without. Panel c and d plot delta net benefit across threshold probabilities for selected models, contrasting with and without UL. Panel e and f show decision curves (internal and external), depicting net benefit by threshold probability, with insets for detailed lower ranges, comparing model performance under both conditions.</alt-text>
</graphic></fig>
<p>Decision curve analysis (DCA) provided complementary evidence at the clinical decision level. Within clinically relevant threshold probability ranges (PT &#x2248; 0.05&#x2013;0.30), the with UL curves for all models lay above both the without UL curves and the &#x201c;treat-all&#x201d;/&#x201d;treat-none&#x201d; strategies. Among them, the stacking and voting ensembles yielded the highest net benefit, with peak &#x394;NB values of approximately 0.03&#x2013;0.04 in the internal cohort, corresponding to an increase of about 2&#x2013;4 correctly identified high-risk patients per 100 individuals (&#x394;TP &#x2248; 2&#x2013;4/100 patients), without a substantial increase in false positives. In the external validation cohort, the absolute magnitude of &#x394;NB was somewhat smaller (on the order of 0.01&#x2013;0.02) and more variable, but the overall pattern remained consistent, with UL models providing higher net benefit across a broad range of decision thresholds.</p>
<p>Taken together, these findings indicate that incorporating UL improves probability calibration and net clinical benefit for PCa risk stratification, while not materially increasing the risk of false positives. The incremental gain is stable across different PSA ranges and is particularly pronounced for ensemble models such as stacking and voting, supporting the role of UL as an independent, quantifiable biomarker with added diagnostic value in PCa risk prediction.</p>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>PSA-based subgroup analysis</title>
<p>To investigate whether the incremental value of UL varies across different levels of tumor burden, we performed a pre-specified subgroup analysis stratified by baseline PSA. In the internal test set (<xref ref-type="fig" rid="f5"><bold>Figures&#xa0;5a, c, e</bold></xref>), all models maintained high discriminative ability within the PSA 4&#x2013;10 and 10&#x2013;20 ng/mL strata, with micro-averaged AUCs clustering around 0.93. Upon incorporation of UL, none of the models showed performance deterioration in any subgroup; instead, the ROC curves shifted slightly towards the upper left. In the PSA 4&#x2013;10 ng/mL subgroup, the absolute micro-AUC gains attributable to UL were modest but directionally consistent across model families&#x2014;tree-based, linear and ensemble learners&#x2014;with &#x394;AUC values largely confined to a narrow range of 0.002&#x2013;0.005, suggesting a small yet robust incremental signal at low-to-intermediate PSA levels. In the PSA 10&#x2013;20 ng/mL subgroup, the magnitude of AUC improvement was further attenuated, and &#x394;AUC varied slightly across algorithms, but changes remained predominantly small and positive with no evidence of systematic degradation. For the PSA &gt;20 ng/mL subgroup, baseline micro-AUCs ranged from approximately 0.82 to 0.89; after adding UL, most models (particularly SVM, KNN and the Voting/Stacking ensembles) exhibited AUC increases of about 0.01&#x2013;0.02, whereas Gradient Boosting and Logistic Regression were essentially unchanged, indicating that the contribution of UL in the high-PSA setting is more uncertain but, overall, unlikely to behave as pure noise.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Micro-ROC curves of models with and without urinary leukocytes (UL) across baseline PSA subgroups. <bold>(a, b)</bold> Results for PSA 4&#x2013;10 ng/mL; <bold>(c, d)</bold> results for PSA 10&#x2013;20 ng/mL; <bold>(e, f)</bold> results for PSA &gt;20 ng/mL. Solid lines denote models incorporating UL, whereas dashed lines denote the corresponding models without UL.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1762494-g005.tif">
<alt-text content-type="machine-generated">Six-panel figure with receiver operating characteristic (ROC) curves for multiple machine learning models predicting outcomes based on PSA levels. Panels a, c, and e show internal test results for PSA subgroups: less than ten, ten to twenty, and greater than twenty, respectively. Panels b, d, and f show corresponding external test results. Each panel plots true positive rate versus false positive rate for five models: gradient boosting, logistic regression, support vector machine, voting, and stacking, with area under the curve (AUC) metrics in the legend. Insets provide a zoomed view of the lower left corner.</alt-text>
</graphic></fig>
<p>Findings in the external validation cohort were broadly concordant with those of the internal cohort, albeit with greater variability (<xref ref-type="fig" rid="f5"><bold>Figures&#xa0;5b, d, f</bold></xref>). Among patients with PSA 4&#x2013;10 ng/mL, micro-AUCs for all models were consistently slightly higher after incorporating UL than for their respective baselines, with &#x394;AUC pointing in the same (favorable) direction, supporting the reproducibility of UL-related gains in the low-PSA range in an independent dataset. In the PSA 10&#x2013;20 ng/mL subgroup, AUC differences largely fluctuated around zero, with only minor positive or negative deviations in individual models, indicating that the overall benefit approaches a marginal effect. In the PSA &gt;20 ng/mL subgroup, where sample size was smaller and class imbalance more pronounced, &#x394;AUC values across algorithms included small positive shifts as well as values close to zero or slightly negative, and the ROC curves were visibly stepwise, underscoring limited estimation precision and an exploratory rather than definitive nature of the evidence in this range.</p>
<p>Taken together, UL did not compromise the discriminative performance of any model across PSA strata and provided a small but consistent incremental discriminative benefit within the PSA 4&#x2013;20 ng/mL interval, with the clearest and most reproducible gains observed in the PSA 4&#x2013;10 ng/mL low-to-intermediate PSA population. For patients with PSA &gt;20 ng/mL, the direction of UL&#x2019;s effect appears broadly non-negative in the current data, but given sample size constraints and unstable ROC estimation, conclusions in this high-PSA subgroup should be interpreted cautiously and confirmed in larger, multi-center cohorts.</p>
</sec>
<sec id="s3_5">
<label>3.5</label>
<title>SHAP-based interpretability analysis</title>
<p>SHAP analyses were conducted using the TreeExplainer, which is optimized for tree-based models, applied to the gradient boosting classifier. The internal training cohort was used as the background reference distribution. SHAP values were computed in a one-vs-rest framework for the high-risk class (class 2), such that positive values indicate increased predicted probability of high-risk PCa and negative values indicate a down-weighting effect. This formulation facilitates direct interpretation of feature contributions to clinically significant disease risk.</p>
<p>Using the internal test set, we computed SHAP values for the gradient boosting model including urinary leukocytes (UL), focusing on predictions for high-risk prostate cancer (class 2), in order to dissect the contribution of individual features to the model output. Global feature importance ranked by mean absolute SHAP value showed that nonlinearly transformed PSA-related indices and MRI-derived features (e.g. BMI:Sine, PHID:Tanh, PHID:Sigmoid, PHI, and PSAD:Tangent) were the principal drivers of high-risk predictions. In contrast, urinary leukocytes contributed more modestly, ranking in the lower tier of all features but exhibiting a small yet consistent impact (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6b</bold></xref>). This pattern is consistent with the intended role of UL as an inflammation-related contextual marker designed to complement, rather than replace, conventional quantitative risk indicators.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>SHAP-based interpretation of the gradient boosting model including urinary leukocytes (UL) for predicting high-risk prostate cancer (class 2). <bold>(a)</bold> Univariate SHAP dependence plot for UL, showing that SHAP values are predominantly mildly negative in UL-positive cases, indicating a down-weighting effect on high-risk predictions. <bold>(b)</bold> Global feature importance ranked by mean absolute SHAP values for class 2 predictions, demonstrating that PSA-related indices and MRI-derived features dominate model output, while UL contributes modest but non-zero information. <bold>(c)</bold> Paired waterfall plots for a representative case (sample #14), comparing the model without UL <bold>(c)</bold> and with UL <bold>(d)</bold>. This example illustrates that the inclusion of UL does not directly increase high-risk probability, but instead reshapes the contribution of other predictors by distinguishing inflammation-related from non-inflammatory PSA elevations, allowing high-risk patterns to be more clearly expressed in UL-negative cases. The x-axes of SHAP dependence plots reflect transformed feature values used for model training rather than raw clinical measurements.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1762494-g006.tif">
<alt-text content-type="machine-generated">Panel a displays a scatter plot showing SHAP values for urinary leukocytes, with most values clustering near one and a color gradient bar for feature contribution. Panel b shows two horizontal bar graphs comparing feature importance without and with urinary leukocytes in the model, including metrics such as PSAD and p2PSA. Panels c and d are beeswarm plots illustrating SHAP value distributions for various features, comparing models excluding (c) and including (d) urinary leukocytes, with feature values color-coded from low (blue) to high (red).</alt-text>
</graphic></fig>
<p>Univariate SHAP analysis for UL (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6a</bold></xref>) further clarified the directionality of its effect. Among UL-positive patients (UL = 1), SHAP values for the high-risk class were predominantly mildly negative, indicating that the model systematically down-weights the predicted probability of high-risk prostate cancer when urinary leukocytes are elevated. In contrast, UL-negative patients (UL = 0) exhibited SHAP values clustered around zero, with a subset showing slightly positive contributions. This finding suggests that, in the presence of abnormal PSA or MRI findings, the absence of urinary inflammatory signals is more compatible with a high-risk phenotype. Importantly, this behavior supports the interpretation of UL as a contextual inflammation marker rather than a direct indicator of tumor aggressiveness.</p>
<p>To illustrate this mechanism at the individual level, we examined a representative high-risk case (sample #14) and plotted paired SHAP waterfall diagrams for models trained without and with UL (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6c</bold></xref>). In the baseline model without UL, the predicted probability for class 2 was approximately 0.11. In the model including UL, although this patient was UL-negative and the direct SHAP contribution of UL itself remained close to zero, the overall feature attribution pattern became more sharply aligned with a high-risk profile. Specifically, the positive contributions of established PSA- and MRI-related features, such as p2PSA:Log, PSAD:Tangent, p2PSA, PHID:Sigmoid, and PIRADS:Square, were more coherently expressed, resulting in an increased predicted probability for class 2 of approximately 0.59. This observation indicates that UL does not increase risk by exerting a large direct effect on individual predictions; rather, its inclusion during model&#xa0;training improves the contextual separation between inflammation-related and non-inflammation-related PSA elevations, allowing&#xa0;canonical high-risk features to express their effects more consistently.</p>
<p>Taken together, the SHAP analyses demonstrate that although urinary leukocytes contribute only modestly in terms of global feature importance, their effect is directionally consistent, clinically interpretable, and mechanistically coherent. By delineating the boundary between inflammatory and non-inflammatory causes of PSA elevation, UL refines probability calibration and reduces misattribution of benign PSA increases to aggressive malignancy. Accordingly, UL should be regarded as an inflammation-related contextual modifier within the risk prediction framework, rather than as an independent tumor biomarker for high-risk prostate cancer.</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussions and conclusion</title>
<p>In this bi-center, real-world cohort, we developed a nonlinear stacking ensemble framework for multi-class prostate cancer risk stratification and demonstrated its robust performance across internal and external datasets. By combining predefined nonlinear feature engineering with stability-oriented LASSO selection, the framework achieved strong discrimination and calibration without reliance on advanced imaging pipelines beyond PI-RADS or on costly omics data. The stacking strategy consistently outperformed individual base learners, yielding multi-class AUCs of approximately 0.96 and 0.93 in the internal and external cohorts, respectively, while maintaining satisfactory cross-center generalizability. These results indicate that integrating heterogeneous learners within a calibrated ensemble can effectively capture complex, nonlinear relationships among routinely available clinical and biochemical variables.</p>
<p>Building on this modeling backbone, we systematically evaluated the incremental contribution of urinary leukocytes (UL), a routinely collected but often overlooked urinalysis parameter. Rather than treating UL as an independent tumor biomarker, we assessed its value in terms of calibration, discrimination, and decision-level utility. Across analyses, UL provided modest but consistent improvements in net clinical benefit, particularly in the clinically ambiguous PSA gray zone (4&#x2013;10 ng/mL), with minimal increase in false-positive classifications. <italic>Post hoc</italic> SHAP analyses conducted on a representative gradient boosting base learner suggested that UL exerts a directionally consistent effect: UL-positive cases tended to receive mildly negative contributions to high-risk predictions, whereas UL-negative cases clustered closer to neutral or slightly positive contributions. Importantly, interpretability analyses were confined to individual base learners and original clinical features, acknowledging that the stacked ensemble itself prioritizes predictive performance over inherent transparency. Within this scope, the observed patterns support a clinically intuitive role of UL as an inflammation-related contextual modifier that refines risk estimation by helping distinguish benign PSA elevations from patterns more compatible with clinically significant disease.</p>
<p>Several limitations warrant consideration. Although data were obtained from two centers, subgroup sample sizes&#x2014;particularly among UL-positive patients and those with PSA &gt;20 ng/mL&#x2014;remain limited, which may reduce the stability of subgroup-level estimates. In addition, UL was treated as a semi-quantitative, essentially binary variable derived from routine urinalysis, potentially underrepresenting the full spectrum of urinary inflammatory activity and precluding exploration of dose&#x2013;response effects. Finally, the retrospective design introduces the possibility of unmeasured confounding and spectrum bias despite external validation. Future studies with larger, prospectively collected cohorts and more granular urinary inflammatory markers are needed to further validate these findings and to clarify how such information can best support biopsy decision-making.</p>
<p>Overall, this work highlights a pragmatic strategy for evaluating the incremental clinical utility of inexpensive, noisy clinical variables within modern machine learning pipelines by explicitly linking feature inclusion to decision-analytic benefit rather than predictive performance alone.</p>
</sec>
</body>
<back>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p></sec>
<sec id="s6" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving humans were approved by Ethics Committee of Tongji Hospital, Tongji Medical College, Huazhong University of Science and Technology (approval No. TJ-IRB202303129). The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study. The animal study was approved by Ethics Committee of Tongji Hospital, Tongji Medical College, Huazhong University of Science and Technology (approval No. TJ-IRB202303129). The study was conducted in accordance with the local legislation and institutional requirements. Written informed consent was obtained from the individual(s) for the publication of any potentially identifiable images or data included in this article.</p></sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>SX: Formal analysis, Writing &#x2013; original draft.. ZR: Data curation, Methodology, Resources, Visualization, Writing &#x2013; original draft. MC: Investigation, Project administration, Resources, Software, Writing &#x2013; original draft. HZ: Software, Writing &#x2013; review &amp; editing. CY: Data curation, Resources, Supervision, Writing &#x2013; review &amp; editing. XW: Data curation, Resources, Supervision, Validation, Writing &#x2013; review &amp; editing.</p></sec>
<ack>
<title>Acknowledgments</title>
<p>The authors are grateful to the doctors in the Department of Urology, Wuhan Tongji Hospital, Tongji Medical College, Huazhong University of Science and Technology for their support in collecting the clinical data.</p>
</ack>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>Author MC was employed by the company Aerospace Nanhu Electronic Information Technology Co., Ltd.</p>
<p>The remaining author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s10" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<sec id="s12" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fonc.2026.1762494/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fonc.2026.1762494/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="DataSheet1.docx" id="SF1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Figure&#xa0;1</label>
<caption>
<p>Distribution of predicted high-risk probabilities in the PSA 4&#x2013;10 ng/mL gray zone among non-high-risk patients. Histograms show the distribution of predicted probabilities for high-risk prostate cancer (class 2) among patients with PSA levels between 4 and 10 ng/mL who were histologically confirmed as non-high-risk (Gleason score &lt; 8). Results are shown separately for the internal test cohort (left) and the external validation cohort (right). Blue bars represent predictions from the base model without urinary leukocytes (UL), while orange bars represent predictions from the model incorporating UL. The vertical dashed line indicates the prespecified decision threshold (p = 0.5) used for high-risk classification. In both cohorts, the majority of non-high-risk patients exhibit low predicted probabilities well below the decision threshold. Incorporation of UL primarily reshapes the lower-probability distribution rather than inducing additional high-risk classifications. Notably, no non-high-risk patients in either cohort crossed the high-risk threshold after inclusion of UL, indicating that UL does not increase false-positive high-risk predictions in the PSA gray-zone population.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF2" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Table&#xa0;1</label>
<caption>
<p>Features with various nonlinear transformations.</p>
</caption></supplementary-material></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sung</surname> <given-names>H</given-names></name>
<name><surname>Ferlay</surname> <given-names>J</given-names></name>
<name><surname>Siegel</surname> <given-names>RL</given-names></name>
<name><surname>Laversanne</surname> <given-names>M</given-names></name>
<name><surname>Soerjomataram</surname> <given-names>I</given-names></name>
<name><surname>Jemal</surname> <given-names>A</given-names></name>
<etal/>
</person-group>. 
<article-title>Global cancer statistics 2020: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title>. <source>CA Cancer J Clin</source>. (<year>2021</year>) <volume>71</volume>:<page-range>209&#x2013;49</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3322/caac.21660</pub-id>, PMID: <pub-id pub-id-type="pmid">33538338</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<label>2</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sungur</surname> <given-names>M</given-names></name>
<name><surname>Aykac</surname> <given-names>A</given-names></name>
<name><surname>Aydin</surname> <given-names>ME</given-names></name>
<name><surname>Celik</surname> <given-names>O</given-names></name>
<name><surname>Kaya</surname> <given-names>C</given-names></name>
</person-group>. 
<article-title>Machine learning-based prediction of prostate biopsy necessity using PSA, MRI, and hematologic parameters</article-title>. <source>J Clin Med</source>. (<year>2024</year>) <volume>14</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/jcm14010183</pub-id>, PMID: <pub-id pub-id-type="pmid">39797267</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<label>3</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wu</surname> <given-names>X</given-names></name>
<name><surname>Liu</surname> <given-names>Z</given-names></name>
<name><surname>Fang</surname> <given-names>Y</given-names></name>
<name><surname>Guoping</surname> <given-names>X</given-names></name>
<name><surname>Zhihua</surname> <given-names>Q</given-names></name>
<name><surname>Hu</surname> <given-names>Z</given-names></name>
<etal/>
</person-group>. 
<article-title>Multimodal nomogram combining multiparametric MRI, functional subsets of peripheral lymphocytes and PI-RADS can predict risk stratification of prostate cancer</article-title>. <source>Comput Methods Programs Biomedicine</source>. (<year>2026</year>) <volume>273</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cmpb.2025.109086</pub-id>, PMID: <pub-id pub-id-type="pmid">41046708</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<label>4</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Fujita</surname> <given-names>K</given-names></name>
<name><surname>Hosomi</surname> <given-names>M</given-names></name>
<name><surname>Tanigawa</surname> <given-names>G</given-names></name>
<name><surname>Okumi</surname> <given-names>M</given-names></name>
<name><surname>Fushimi</surname> <given-names>H</given-names></name>
<name><surname>Yamaguchi</surname> <given-names>S</given-names></name>
</person-group>. 
<article-title>Prostatic inflammation detected in initial biopsy specimens and urinary pyuria are predictors of negative repeat prostate biopsy</article-title>. <source>J Urol</source>. (<year>2011</year>) <volume>185</volume>:<page-range>1722&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.juro.2010.12.058</pub-id>, PMID: <pub-id pub-id-type="pmid">21420119</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<label>5</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Fujita</surname> <given-names>K</given-names></name>
<name><surname>Nonomura</surname> <given-names>N</given-names></name>
</person-group>. 
<article-title>Urinary biomarkers of prostate cancer</article-title>. <source>Int J Urol</source>. (<year>2018</year>) <volume>25</volume>:<page-range>770&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/iju.13734</pub-id>, PMID: <pub-id pub-id-type="pmid">30129068</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<label>6</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Nepal</surname> <given-names>A</given-names></name>
<name><surname>Sharma</surname> <given-names>P</given-names></name>
<name><surname>Bhattarai</surname> <given-names>S</given-names></name>
<name><surname>Mahajan</surname> <given-names>Z</given-names></name>
<name><surname>Sharma</surname> <given-names>A</given-names></name>
<name><surname>Sapkota</surname> <given-names>A</given-names></name>
<etal/>
</person-group>. 
<article-title>Extremely elevated prostate-specific antigen in acute prostatitis: A case report</article-title>. <source>Cureus</source>. (<year>2023</year>) <volume>15</volume>:<fpage>e43730</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.7759/cureus.43730</pub-id>, PMID: <pub-id pub-id-type="pmid">37727194</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<label>7</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Demir</surname> <given-names>S</given-names></name>
</person-group>. 
<article-title>Role of sterile pyuria in association to elevated PSA values in the diagnosis of non-palpable prostate cancer</article-title>? <source>Arch Ital Urol Androl</source>. (<year>2019</year>) <volume>91</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.4081/aiua.2019.3.167</pub-id>, PMID: <pub-id pub-id-type="pmid">31577101</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<label>8</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yang</surname> <given-names>C</given-names></name>
<name><surname>Liu</surname> <given-names>Z</given-names></name>
<name><surname>Fang</surname> <given-names>Y</given-names></name>
<name><surname>Cao</surname> <given-names>X</given-names></name>
<name><surname>Xu</surname> <given-names>G</given-names></name>
<name><surname>Wang</surname> <given-names>Z</given-names></name>
<etal/>
</person-group>. 
<article-title>Development and validation of a clinic machine-learning nomogram for the prediction of risk stratifications of prostate cancer based on functional subsets of peripheral lymphocyte</article-title>. <source>J Transl Med</source>. (<year>2023</year>) <volume>21</volume>:<fpage>465</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12967-023-04318-w</pub-id>, PMID: <pub-id pub-id-type="pmid">37438820</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<label>9</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cao</surname> <given-names>X</given-names></name>
<name><surname>Fang</surname> <given-names>Y</given-names></name>
<name><surname>Yang</surname> <given-names>C</given-names></name>
<name><surname>Liu</surname> <given-names>Z</given-names></name>
<name><surname>Xu</surname> <given-names>G</given-names></name>
<name><surname>Jiang</surname> <given-names>Y</given-names></name>
<etal/>
</person-group>. 
<article-title>Prediction of prostate cancer risk stratification based on A nonlinear transformation stacking learning strategy</article-title>. <source>Int Neurourol J Mar</source>. (<year>2024</year>) <volume>28</volume>:<fpage>33</fpage>&#x2013;<lpage>43</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5213/inj.2346332.166</pub-id>, PMID: <pub-id pub-id-type="pmid">38569618</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<label>10</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mamidi</surname> <given-names>YKK</given-names></name>
<name><surname>Mamidi</surname> <given-names>TKK</given-names></name>
<name><surname>Kabir</surname> <given-names>MWU</given-names></name>
<name><surname>Wu</surname> <given-names>J</given-names></name>
<name><surname>Hoque</surname> <given-names>MT</given-names></name>
<name><surname>Hicks</surname> <given-names>C</given-names></name>
</person-group>. 
<article-title>PCa-clf: A classifier of prostate cancer patients into patients with indolent and aggressive tumors using machine learning</article-title>. <source>Mach Learn Knowledge Extraction</source>. (<year>2023</year>) <volume>5</volume>:<page-range>1302&#x2013;19</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/make5040066</pub-id>, PMID: <pub-id pub-id-type="pmid">41725453</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<label>11</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chen</surname> <given-names>T</given-names></name>
<name><surname>Kabir</surname> <given-names>MF</given-names></name>
</person-group>. 
<article-title>Explainable machine learning approach for cancer prediction through binarilization of RNA sequencing data</article-title>. <source>PloS One</source>. (<year>2024</year>) <volume>19</volume>:<fpage>e0302947</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0302947</pub-id>, PMID: <pub-id pub-id-type="pmid">38728288</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<label>12</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shu</surname> <given-names>X</given-names></name>
<name><surname>Liu</surname> <given-names>Y</given-names></name>
<name><surname>Qiao</surname> <given-names>X</given-names></name>
<name><surname>Ai</surname> <given-names>G</given-names></name>
<name><surname>Liu</surname> <given-names>L</given-names></name>
<name><surname>Liao</surname> <given-names>J</given-names></name>
<etal/>
</person-group>. 
<article-title>Radiomic-based machine learning model for the accurate prediction of prostate cancer risk stratification</article-title>. <source>Br J Radiol</source>. (<year>2023</year>) <volume>96</volume>:<elocation-id>20220238</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1259/bjr.20220238</pub-id>, PMID: <pub-id pub-id-type="pmid">36475858</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<label>13</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chou</surname> <given-names>YJ</given-names></name>
<name><surname>Jong</surname> <given-names>BE</given-names></name>
<name><surname>Tsai</surname> <given-names>YC</given-names></name>
</person-group>. 
<article-title>Integrating PSA change with PSA density enhances diagnostic accuracy and helps avoid unnecessary prostate biopsies</article-title>. <source>Diagnostics (Basel)</source>. (<year>2025</year>) <volume>15</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/diagnostics15162027</pub-id>, PMID: <pub-id pub-id-type="pmid">40870878</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<label>14</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Stephan</surname> <given-names>C</given-names></name>
<name><surname>Vincendeau</surname> <given-names>S</given-names></name>
<name><surname>Houlgatte</surname> <given-names>A</given-names></name>
<name><surname>Cammann</surname> <given-names>H</given-names></name>
<name><surname>Jung</surname> <given-names>K</given-names></name>
<name><surname>Semjonow</surname> <given-names>A</given-names></name>
</person-group>. 
<article-title>Multicenter evaluation of [-2]proprostate-specific antigen and the prostate health index for detecting prostate cancer</article-title>. <source>Clin Chem</source>. (<year>2013</year>) <volume>59</volume>:<page-range>306&#x2013;14</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1373/clinchem.2012.195784</pub-id>, PMID: <pub-id pub-id-type="pmid">23213080</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<label>15</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Nieboer</surname> <given-names>D</given-names></name>
<name><surname>Vergouwe</surname> <given-names>Y</given-names></name>
<name><surname>Roobol</surname> <given-names>MJ</given-names></name>
<name><surname>Auvinen</surname> <given-names>E</given-names></name>
<name><surname>Kattan</surname> <given-names>S</given-names></name>
<name><surname>van der Kwast</surname> <given-names>P</given-names></name>
<etal/>
</person-group>. 
<article-title>Nonlinear modeling was applied thoughtfully for risk prediction: the Prostate Biopsy Collaborative Group</article-title>. <source>J Clin Epidemiol</source>. (<year>2015</year>) <volume>68</volume>:<page-range>426&#x2013;34</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jclinepi.2014.11.022</pub-id>, PMID: <pub-id pub-id-type="pmid">25777297</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<label>16</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wu</surname> <given-names>J</given-names></name>
<name><surname>Jin</surname> <given-names>X</given-names></name>
<name><surname>Li</surname> <given-names>J</given-names></name>
<name><surname>Zhang</surname> <given-names>Y</given-names></name>
<name><surname>Wang</surname> <given-names>Q</given-names></name>
<name><surname>Li</surname> <given-names>H</given-names></name>
<etal/>
</person-group>. 
<article-title>Development and validation of a prostate cancer risk prediction model for the elevated PSA population</article-title>. <source>Front Oncol</source>. (<year>2025</year>) <volume>15</volume>:<elocation-id>1599266</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fonc.2025.1599266</pub-id>, PMID: <pub-id pub-id-type="pmid">41030951</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<label>17</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Tibshirani</surname> <given-names>R</given-names></name>
</person-group>. 
<article-title>Regression shrinkage and selection via the lasso</article-title>. <source>J R Stat Soc Ser B: Stat Methodology</source>. (<year>1996</year>) <volume>58</volume>:<page-range>267&#x2013;88</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.2517-6161.1996.tb02080.x</pub-id>, PMID: <pub-id pub-id-type="pmid">41738386</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<label>18</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lu</surname> <given-names>W</given-names></name>
<name><surname>Zhao</surname> <given-names>L</given-names></name>
<name><surname>Wang</surname> <given-names>S</given-names></name>
<name><surname>Zhang</surname> <given-names>J</given-names></name>
<name><surname>Li</surname> <given-names>M</given-names></name>
<name><surname>Xu</surname> <given-names>Y</given-names></name>
<etal/>
</person-group>. 
<article-title>Explainable and visualizable machine learning models to predict biochemical recurrence of prostate cancer</article-title>. <source>Clin Transl Oncol</source>. (<year>2024</year>) <volume>26</volume>:<page-range>2369&#x2013;79</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12094-024-03480-x</pub-id>, PMID: <pub-id pub-id-type="pmid">38602643</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<label>19</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Fuadah</surname> <given-names>YN</given-names></name>
<name><surname>Pramudito</surname> <given-names>MA</given-names></name>
<name><surname>Lim</surname> <given-names>KM</given-names></name>
</person-group>. 
<article-title>An optimal approach for heart sound classification using grid search in hyperparameter optimization of machine learning</article-title>. <source>Bioengineering (Basel)</source>. (<year>2022</year>) <volume>10</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/bioengineering10010045</pub-id>, PMID: <pub-id pub-id-type="pmid">36671616</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<label>20</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Nagarajan</surname> <given-names>R</given-names></name>
<name><surname>Upreti</surname> <given-names>M</given-names></name>
</person-group>. 
<article-title>An approach for deciphering patient-specific variations with application to breast cancer molecular expression profiles</article-title>. <source>J BioMed Inform. Oct</source>. (<year>2016</year>) <volume>63</volume>:<page-range>120&#x2013;30</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jbi.2016.07.022</pub-id>, PMID: <pub-id pub-id-type="pmid">27477838</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<label>21</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yan</surname> <given-names>F</given-names></name>
<name><surname>Feng</surname> <given-names>Y</given-names></name>
</person-group>. 
<article-title>A two-stage stacked-based heterogeneous ensemble learning for cancer survival prediction</article-title>. <source>Complex Intelligent Systems</source>. (<year>2022</year>) <volume>8</volume>:<page-range>4619&#x2013;39</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s40747-022-00791-w</pub-id>, PMID: <pub-id pub-id-type="pmid">41737715</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<label>22</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cao-Van</surname> <given-names>K</given-names></name>
<name><surname>Minh</surname> <given-names>TC</given-names></name>
<name><surname>Minh</surname> <given-names>LG</given-names></name>
<name><surname>Quyen</surname> <given-names>TTB</given-names></name>
<name><surname>Tan</surname> <given-names>HM</given-names></name>
</person-group>. 
<article-title>Soft-voting ensemble model: an efficient learning approach for predictive prostate cancer risk</article-title>. <source>Vietnam J Comput Science</source>. (<year>2024</year>) <volume>11</volume>:<page-range>531&#x2013;52</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1142/s2196888824500155</pub-id>, PMID: <pub-id pub-id-type="pmid">40951326</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<label>23</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kadam</surname> <given-names>VJ</given-names></name>
<name><surname>Jadhav</surname> <given-names>SM</given-names></name>
<name><surname>Vijayakumar</surname> <given-names>K</given-names></name>
</person-group>. 
<article-title>Breast cancer diagnosis using feature ensemble learning based on stacked sparse autoencoders and softmax regression</article-title>. <source>J Med Syst</source>. (<year>2019</year>) <volume>43</volume>:<fpage>263</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10916-019-1397-z</pub-id>, PMID: <pub-id pub-id-type="pmid">31270634</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<label>24</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Tsokani</surname> <given-names>S</given-names></name>
<name><surname>Veroniki</surname> <given-names>AA</given-names></name>
<name><surname>Pandis</surname> <given-names>N</given-names></name>
<name><surname>Mavridis</surname> <given-names>D</given-names></name>
</person-group>. 
<article-title>Assessing the performance of diagnostic test accuracy measures</article-title>. <source>Am J Orthod Dentofacial Orthop</source>. (<year>2022</year>) <volume>161</volume>:<page-range>748&#x2013;51</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ajodo.2021.12.007</pub-id>, PMID: <pub-id pub-id-type="pmid">35473837</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<label>25</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Han</surname> <given-names>JH</given-names></name>
<name><surname>Lee</surname> <given-names>S</given-names></name>
<name><surname>Lee</surname> <given-names>B</given-names></name>
<name><surname>Kim</surname> <given-names>M</given-names></name>
<name><surname>Park</surname> <given-names>J</given-names></name>
<name><surname>Cho</surname> <given-names>Y</given-names></name>
<etal/>
</person-group>. 
<article-title>Explainable ML models for a deeper insight on treatment decision for localized prostate cancer</article-title>. <source>Sci Rep</source>. (<year>2023</year>) <volume>13</volume>:<fpage>11532</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-023-38162-1</pub-id>, PMID: <pub-id pub-id-type="pmid">37460568</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1009577">Andrea Zivi</ext-link>, Imperial College London, United Kingdom</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/700491">Pedro Matos-Filipe</ext-link>, Pompeu Fabra University, Spain</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2054889">Tatsushi Kawada</ext-link>, Medical University of Vienna, Austria</p></fn>
</fn-group>
</back>
</article>