<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Oncol.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Oncology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Oncol.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2234-943X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fonc.2026.1775750</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>A foundation model-based multi-instance learning framework for accurate prediction of lymph node metastasis in prostate cancer from whole slide images</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Zeng</surname><given-names>Guang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname><given-names>Weiwei</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Mei</surname><given-names>Haonan</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3064752/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Du</surname><given-names>Ran</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3372792/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Division of Urology, The Central Hospital of Enshi Tujia and Miao Autonomous Prefecture</institution>, <city>Enshi</city>, <state>Hubei</state>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>Division of Nephrology, The Central Hospital of Enshi Tujia and Miao Autonomous Prefecture</institution>, <city>Enshi</city>, <state>Hubei</state>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff3"><label>3</label><institution>Hubei Selenium and Human Health Institute, The Central Hospital of Enshi Tujia and Miao Autonomous Prefecture</institution>, <city>Enshi</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff4"><label>4</label><institution>Hubei Provincial Key Lab of Selenium Resources and Bioapplications</institution>, <city>Enshi</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff5"><label>5</label><institution>The First Clinical College, Wuhan University</institution>, <city>Wuhan</city>, <state>Hubei</state>,&#xa0;<country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Ran Du, <email xlink:href="mailto:duran19881025@163.com">duran19881025@163.com</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-03-04">
<day>04</day>
<month>03</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>16</volume>
<elocation-id>1775750</elocation-id>
<history>
<date date-type="received">
<day>26</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>13</day>
<month>02</month>
<year>2026</year>
</date>
<date date-type="rev-recd">
<day>04</day>
<month>02</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Zeng, Li, Mei and Du.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Zeng, Li, Mei and Du</copyright-holder>
<license>
<ali:license_ref start_date="2026-03-04">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Nodal involvement (N stage) is a key prognostic factor in prostate cancer (PCa). Conventional imaging and histopathology often have limited sensitivity and inter-observer variability. AI-based computational pathology, using multi-instance learning (MIL) and foundation models, offers a promising approach for accurate and interpretable N stage prediction from H&amp;E-stained whole slide images (WSIs).</p>
</sec>
<sec>
<title>Methods</title>
<p>In this multicenter retrospective study, we developed a weakly supervised deep learning framework integrating MIL with domain-adapted foundation model encoders (UNI-v2, CONCH, ResNet-50) to predict N stage. WSIs from 280 RHWU patients were used for training and 306 TCGA patients for external validation. Attention heatmaps enabled interpretability, while transcriptomic analyses explored molecular correlates via differential expression and bioinformation analysis.</p>
</sec>
<sec>
<title>Results</title>
<p>The UNI-v2-based model achieved the highest performance (AUC 0.879 in RHWU, 0.850 in TCGA), surpassing CONCH and ResNet-50. Attention heatmaps highlighted tumor-stromal interfaces and poorly differentiated tumor clusters. Transcriptomic analysis identified 94 differentially expressed genes; upregulated genes were enriched in cell cycle, and immune pathways, while downregulated genes involved ion transport and metabolism.</p>
</sec>
<sec>
<title>Conclusions</title>
<p>This AI-MIL framework accurately predicts nodal involvement in PCa and provides biologically interpretable insights, supporting its potential as a precision oncology tool for risk stratification and treatment planning.</p>
</sec>
</abstract>
<kwd-group>
<kwd>artificial intelligence</kwd>
<kwd>computational pathology</kwd>
<kwd>lymph node metastasis</kwd>
<kwd>multi-instance learning</kwd>
<kwd>N staging</kwd>
<kwd>prostate cancer</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This work was supported by Natural Science Foundation of Enshi Tujia and Miao Autonomous Prefecture Government (D20230060). </funding-statement>
</funding-group>
<counts>
<fig-count count="7"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="29"/>
<page-count count="12"/>
<word-count count="5120"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Genitourinary Oncology</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Prostate cancer (PCa) is the second most frequently diagnosed malignancy and the fifth leading cause of cancer-related death among men worldwide (<xref ref-type="bibr" rid="B1">1</xref>). According to global cancer statistics, over 1.4 million new cases and 313,780 deaths were reported in 2025, with incidence continuing to rise due to population aging and improved diagnostic strategies (<xref ref-type="bibr" rid="B2">2</xref>). With an aging population worldwide, the volume of prostate biopsy specimens is expected to increase dramatically (<xref ref-type="bibr" rid="B3">3</xref>). Despite advances in imaging and systemic therapy, accurate staging remains essential for determining treatment strategies and predicting outcomes in PCa patients (<xref ref-type="bibr" rid="B4">4</xref>). Among the staging components, nodal involvement (N stage) is particularly critical, as lymph node metastasis is strongly associated with biochemical recurrence, distant progression, and reduced cancer-specific survival (<xref ref-type="bibr" rid="B5">5</xref>). Patients with positive lymph nodes often require multimodal treatment strategies, including androgen deprivation therapy, radiation, or systemic chemotherapy, in addition to radical prostatectomy (<xref ref-type="bibr" rid="B6">6</xref>).</p>
<p>Current evaluation of N stage primarily relies on preoperative imaging modalities such as computed tomography (CT), magnetic resonance imaging (MRI) (<xref ref-type="bibr" rid="B7">7</xref>), and prostate-specific membrane antigen positron emission tomography (PSMA-PET) (<xref ref-type="bibr" rid="B8">8</xref>). While PSMA-PET has demonstrated superior sensitivity compared with conventional imaging, its availability is limited in many regions, and its specificity remains imperfect. Histopathological examination of lymph nodes obtained during pelvic lymph node dissection (PLND) remains the gold standard; however, PLND is invasive and associated with perioperative risks. Furthermore, histological assessment of H&amp;E-stained sections is subject to inter-observer variability, and small metastatic foci may be missed in routine practice (<xref ref-type="bibr" rid="B9">9</xref>). These limitations highlight the unmet need for accurate, scalable, and reproducible tools to predict nodal status in PCa.</p>
<p>Artificial intelligence (AI), particularly deep learning applied to digital pathology, has emerged as a transformative approach in oncological diagnostics (<xref ref-type="bibr" rid="B10">10</xref>). By leveraging whole slide images (WSIs), AI can capture subtle morphological patterns beyond the recognition of human observers. Multiple-Instance Learning (MIL), a weakly supervised paradigm, is particularly suitable for WSI analysis, as it requires only slide-level labels (e.g., N-positive vs. N-negative) without the need for exhaustive region-level annotation (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B12">12</xref>). Recent developments in foundation models&#x2014;large-scale pretrained encoders specifically adapted to histopathology&#x2014;further enhance feature extraction, enabling generalizable and domain-specific representations of tissue morphology. Integrating MIL with pathology foundation models therefore represents a promising avenue for building robust, interpretable, and clinically deployable models for nodal staging in PCa. Beyond prediction, linking computational pathology findings with molecular alterations offers an opportunity to deepen biological understanding and identify novel biomarkers. Transcriptomic profiling from The Cancer Genome Atlas (TCGA) has revealed distinct molecular subtypes and immune landscapes of PCa, and integration with AI-derived predictions may provide mechanistic insights. In particular, exploring differentially expressed genes (DEGs), functional enrichment pathways, and immune infiltration profiles between N-positive and N-negative patients could illuminate tumor&#x2013;immune interactions that drive metastatic dissemination (<xref ref-type="bibr" rid="B13">13</xref>).</p>
<p>In this study, we proposed a foundation model&#x2013;based MIL framework for predicting N stage in prostate cancer from H&amp;E-stained WSIs, using multicenter cohorts from RHWU and TCGA. Our objectives were threefold: (i) to develop and validate a weakly supervised model for slide-level prediction of nodal involvement, (ii) to provide interpretability through attention heatmaps highlighting predictive histological regions, and (iii) to perform exploratory bioinformatics analyses for uncovering potential molecular and immune correlates of nodal metastasis. This work aims to bridge the gap between computational pathology and translational oncology, ultimately supporting precision medicine in PCa management.</p>
</sec>
<sec id="s2">
<label>2</label>
<title>Methods</title>
<sec id="s3_1">
<label>2.1</label>
<title>Patient cohorts</title>
<p>This multicenter retrospective study analyzed two independent prostate cancer cohorts. The internal dataset comprised 280 patients who underwent radical prostatectomy at the Renmin Hospital of Wuhan University (RHWU, Wuhan, China) between 2018 and 2023. Eligible patients were required to have histologically confirmed prostate adenocarcinoma, complete clinicopathological information including postoperative nodal status, and diagnostic-grade hematoxylin and eosin (H&amp;E)-stained WSIs containing more than 10% tumor area. Patients who had received neoadjuvant therapy prior to surgery were excluded. The external validation cohort consisted of 306 prostate adenocarcinoma patients from the TCGA-PRAD database, accessed in April 2024. This cohort provided both digitized WSIs and matched RNA sequencing data. Clinical information, including patient age, preoperative prostate-specific antigen (PSA) levels, Gleason grade, and TNM stage, was collected for all cases. Detailed cohort information is presented in <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref> and <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Demographic and staging systems in prostate cancer patients. Pri Gle for primary Gleason Score, Sec Gle for Secondary Gleason Score, T, N, and M for tumor TNM stage system.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1775750-g001.tif">
<alt-text content-type="machine-generated">Grid of ten donut charts compares percentages for Pri Gleason, Sec Gleason, T, N, and M variables across RHWU and TCGA cohorts. Distinct colors represent each pattern or group as shown in the key.</alt-text>
</graphic></fig>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>The distributions of demographic and clinicopathologic characteristics of patients.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left"/>
<th valign="middle" align="left">RHWU (N = 280)</th>
<th valign="middle" align="left">TCGA (N = 306)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">Age (Years)</td>
<td valign="middle" align="left">74.1 &#xb1; 7.9</td>
<td valign="middle" align="left">61.0 &#xb1; 6.8</td>
</tr>
<tr>
<th valign="middle" colspan="3" align="left">Median pre-op PSA (ng/mL)</th>
</tr>
<tr>
<td valign="middle" align="left">tPSA</td>
<td valign="middle" align="left">39.7 &#xb1; 52.8</td>
<td valign="middle" align="left">na</td>
</tr>
<tr>
<td valign="middle" align="left">cPSA</td>
<td valign="middle" align="left">31.2 &#xb1; 18.6</td>
<td valign="middle" align="left">na</td>
</tr>
<tr>
<th valign="middle" colspan="3" align="left">TNM stage</th>
</tr>
<tr>
<td valign="middle" align="left">T2</td>
<td valign="middle" align="left">28.2%</td>
<td valign="middle" align="left">83.9%</td>
</tr>
<tr>
<td valign="middle" align="left">T3</td>
<td valign="middle" align="left">46.0%</td>
<td valign="middle" align="left">11.8%</td>
</tr>
<tr>
<td valign="middle" align="left">T4</td>
<td valign="middle" align="left">25.8%</td>
<td valign="middle" align="left">4.3%</td>
</tr>
<tr>
<td valign="middle" align="left">N0</td>
<td valign="middle" align="left">60.5%</td>
<td valign="middle" align="left">76.4%</td>
</tr>
<tr>
<td valign="middle" align="left">N1</td>
<td valign="middle" align="left">39.4%</td>
<td valign="middle" align="left">23.5%</td>
</tr>
<tr>
<td valign="middle" align="left">M0</td>
<td valign="middle" align="left">78.3%</td>
<td valign="middle" align="left">93.3%</td>
</tr>
<tr>
<td valign="middle" align="left">M1</td>
<td valign="middle" align="left">21.7%</td>
<td valign="middle" align="left">6.7%</td>
</tr>
<tr>
<th valign="middle" colspan="3" align="left">Post-op GS (ISUP)</th>
</tr>
<tr>
<td valign="middle" align="left">2-6 (I)</td>
<td valign="middle" align="left">27.0%</td>
<td valign="middle" align="left">4.9%</td>
</tr>
<tr>
<td valign="middle" align="left">7 (II)</td>
<td valign="middle" align="left">20.5%</td>
<td valign="middle" align="left">31.0%</td>
</tr>
<tr>
<td valign="middle" align="left">7 (III)</td>
<td valign="middle" align="left">16.4%</td>
<td valign="middle" align="left">23.5%</td>
</tr>
<tr>
<td valign="middle" align="left">8 (IV)</td>
<td valign="middle" align="left">19.3%</td>
<td valign="middle" align="left">16.0%</td>
</tr>
<tr>
<td valign="middle" align="left">9-10 (V)</td>
<td valign="middle" align="left">16.8%</td>
<td valign="middle" align="left">24.5%</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>PSA, prostate-specific antigen; GS, Gleason score.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3_2">
<label>2.2</label>
<title>Overview of the study workflow</title>
<p>The workflow of the Prostate N stage prediction module is as follows and demonstrated in <xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref>. The training dataset comprises H&amp;E-stained WSIs from the aforementioned cohorts, each labeled at the sample level according to pathological N stage (N0 or N1). Pathological images corresponding to each patient were collected from both cohorts. For the RHWU cohort, WSIs were digitized using a KF-PRO-020 digital slide scanner (KFBIO Co., Ltd.) at a magnification of 40&#xd7; (0.25 &#x3bc;m per pixel). Each WSI was uniformly divided into 256 &#xd7; 256 pixel patches, which were subsequently grouped into bags. These bags, together with their WSI-level N stage labels, served as input for training the MIL module. The trained model was then evaluated on both internal and external validation datasets, and its predicted N stages were compared against the pathologist-determined ground truth to assess performance and generalizability.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Flow chat of pretraining foundational model-based feature extraction and multi-instance learning for N stage predict in prostate cancer.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1775750-g002.tif">
<alt-text content-type="machine-generated">Flowchart illustrates an automated pathology workflow for lymph node staging, showing preprocessing and patching of histology images, feature encoding, extraction, attention mechanism, multi-class prediction, and evaluation with ROC and survival plots.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_3">
<label>2.3</label>
<title>Preprocessing</title>
<p>For the RHWU cohort, H&amp;E slides were digitized using the digital slide scanner (KFBIO Co., Ltd., Ningbo, China) at 40&#xd7; magnification with a resolution of 0.12 &#x3bc;m/pixel. Images with quality issues such as air bubbles, uneven staining, severe fading, tissue folds, or out-of-focus areas were excluded from analysis. TCGA slides were obtained as pre-scanned digital images in SVS format. Each WSI was subdivided into non-overlapping patches of 256 &#xd7; 256 pixels following stain normalization using the Macenko method in order to minimize color variation across samples. Patches containing more than 80% background area were discarded, which is the empirical criterion threshold that aims to balance noise reduction with preservation of informative tissue regions, and the remaining patches were aggregated into bags, which served as the analytical units for subsequent MIL.</p>
</sec>
<sec id="s3_4">
<label>2.4</label>
<title>Feature extract and deep learning methods</title>
<p>To extract meaningful representations from the image patches, three distinct pretrained encoders were selected based on their complementary strengths for histopathological analysis. Each model offers a different paradigm for visual representation learning: (i) UNI-v2, a histopathology-specific foundation model, leverages a self-supervised DINOv2 framework trained on large-scale histopathological datasets, which makes it particularly adept at capturing domain-relevant morphological patterns and robust to tissue-level variations (<xref ref-type="bibr" rid="B14">14</xref>). (ii) CONCH, a vision-language foundation model, is pretrained on paired histopathology images and biomedical text, enabling it to encode not only visual features but also semantically rich contextual knowledge highly relevant to diagnostic pathology (<xref ref-type="bibr" rid="B15">15</xref>). (iii) ResNet-50, a widely used convolutional architecture pretrained on ImageNet, was included as a well-established and general-purpose baseline to provide a performance benchmark and assess the added value of domain-specific pretraining. Each 256 &#xd7; 256 patch was processed by the chosen encoder to yield a 1024- or 2048-dimensional feature vector, which were then aggregated at the whole-slide image (bag) level for downstream analysis (<xref ref-type="bibr" rid="B16">16</xref>).</p>
<p>The prediction of nodal involvement was performed using the Clustering-constrained Attention Multiple Instance Learning (CLAM) framework with a single-branch attention mechanism (clam-sb) (<xref ref-type="bibr" rid="B17">17</xref>). CLAM was selected over other MIL approaches (e.g., DSMIL, Transformer-based MIL) for several reasons. First, its gated attention mechanism is well-suited for histopathology tasks characterized by high intra-slide heterogeneity and weak supervision. Second, unlike Transformer-based MIL models which typically require larger datasets to avoid overfitting, CLAM has demonstrated robust performance on cohorts of moderate size comparable to ours. Third, CLAM explicitly models instance-level ambiguity by imposing clustering constraints, which helps identify both supportive and contradictory evidence within a slide, enhancing interpretability and robustness. Finally, CLAM provides direct visualization of attention scores, allowing transparent identification of the morphological regions most influential for the prediction, which aligns with our objective of model interpretability.</p>
<p>The RHWU cohort was used for model training and internal evaluation via five-fold cross-validation to preserve the class distribution in each fold during model development, with patients randomly assigned to training and test subsets in an 8:2 ratio. The TCGA-PRAD cohort served as an independent external validation set. Model performance was assessed at the patient level using multiple metrics, including accuracy, precision, recall, specificity, F1-score, and the area under the receiver operating characteristic curve (AUC), with 95% confidence intervals estimated by bootstrapping.</p>
<p>Feature extraction was performed using frozen pretrained encoders mentioned above. Encoder parameters were not fine-tuned during MIL training. Slide-level classification was optimized using a cross-entropy loss. The Adam optimizer was employed with an initial learning rate of 1 &#xd7; 10<sup>-4</sup>; and a weight decay of 1 &#xd7; 10<sup>-5</sup>. Training was conducted for a maximum of 20 epochs, and a dropout rate of 0.25 was applied to mitigate overfitting. Instance-level clustering was enabled without an explicit instance-level loss term. A total of eight representative instances (B = 8) were sampled from each bag during training, and the bag-level loss was weighted by a coefficient of 0.7. No class-weighted sampling strategy was applied at the patient level.</p>
</sec>
<sec id="s3_5">
<label>2.5</label>
<title>Visualization and interpretability</title>
<p>Model interpretability was examined through visualization of attention heatmaps. For a representative subset of cases (n=30 WSIs each from N0 and N1 groups, randomly selected), the tiles with the highest attention scores were extracted. These tiles, along with their corresponding low-attention control tiles from the same slide, were presented in a blinded and randomized order to two board-certified genitourinary pathologists. The pathologists were asked to qualitatively assess the presence of predefined histopathological features associated with aggressiveness (e.g., poorly differentiated clusters, nuclear atypia, stromal response) and to assign a subjective &#x201c;suspicion for metastasis&#x201d; score on a 3-point scale (low, intermediate, high).</p>
<p>To explore the potential molecular basis underlying the imaging-derived predictions, hypothesis-generating transcriptomic analyses were performed using RNA sequencing data from the TCGA-PRAD cohort. Patients were stratified according to pathological nodal status. Differential expression analysis was conducted using the edgeR package in R, with genes considered significant at an absolute log2 fold change greater than one and an adjusted p-value below 0.05. Identified differentially expressed genes (DEGs) were subjected to Gene Ontology (GO) and Kyoto Encyclopedia of Genes and Genomes (KEGG) enrichment analyses using the clusterProfiler package to elucidate the biological processes and pathways associated with nodal involvement. Genes strongly associated with nodal status were further evaluated for prognostic significance using Kaplan&#x2013;Meier survival analyses, with overall survival (OS) as primary endpoint.</p>
</sec>
<sec id="s3_6">
<label>2.6</label>
<title>Statistical analysis and hardware</title>
<p>All statistical analyses were carried out using R software (version 3.5.1), Python 3.7, and SPSS 25.0 software (IBM Corp., Armonk, NY). The diagnostic performance of each model was assessed using confusion matrixes, receiver operating characteristic (ROC) curves, and the area under the curve (AUC). Descriptive analyses were presented using MEAN &#xb1; SD. A two-sided p-value &lt; 0.05 was considered statistically significant. The training, testing, and inferring processes of the network were performed in PyTorch (Version 1.6, Python 3.8, Ubuntu 20.04.6 LTS, GeForce RTX4090).</p>
</sec>
<sec id="s3_7">
<label>2.7</label>
<title>Ethics approval and consent to participate</title>
<p>This study was conducted in accordance with the ethical standards of the Declaration of Helsinki and was approved by the RHWU Ethics Committee. Informed consent from the participants was waived by the institutional review board as the current study satisfied the following requirement for the waiver of informed consent: the research involved minimal risk to the participants.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s4_1">
<label>3.1</label>
<title>Model development and predictive performance</title>
<p>The proposed foundation model&#x2013;based multi-instance learning framework successfully predicted nodal involvement in prostate cancer using H&amp;E-stained whole slide images. Across five-fold cross-validation in the RHWU cohort, all encoders achieved robust classification performance, with the UNI-v2 encoder consistently outperforming CONCH and ResNet-50. Specifically, the UNI-v2 model achieved an average AUC of 0.879 (95% CI 0.834&#x2013;0.920), accuracy of 81.4%, specificity of 73.0%, and F1 Score of 78.0%. By contrast, the CONCH-based model demonstrated an AUC of 0.833 (95% CI 0.786&#x2013;0.878), while the ResNet-50 baseline reached 0.837 (95% CI 0.786&#x2013;0.882). External validation on the TCGA cohort confirmed the generalizability of the models, with UNI-v2 again providing the strongest performance (AUC = 0.850, accuracy = 80.4%), followed by CONCH (AUC = 0.791) and ResNet-50 (AUC = 0.805). ROC and confusion matrix analysis illustrated consistent superiority of the UNI-v2 encoder across both datasets. The detailed results can be shown in <xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref> and <xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref>.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>The efficacy of different cohorts in identifying N involvement in prostate cancer patients.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Cohort</th>
<th valign="middle" align="left">Model</th>
<th valign="middle" align="left">Acc</th>
<th valign="middle" align="left">Pre</th>
<th valign="middle" align="left">Recall</th>
<th valign="middle" align="left">Spe</th>
<th valign="middle" align="left">F1 Sco</th>
<th valign="middle" align="left">AUC</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">RHWU</td>
<td valign="middle" align="left">UNI-v2</td>
<td valign="middle" align="left">0.814</td>
<td valign="middle" align="left">0.730</td>
<td valign="middle" align="left">0.836</td>
<td valign="middle" align="left">0.800</td>
<td valign="middle" align="left">0.780</td>
<td valign="middle" align="left">0.879</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">CONCH</td>
<td valign="middle" align="left">0.754</td>
<td valign="middle" align="left">0.678</td>
<td valign="middle" align="left">0.709</td>
<td valign="middle" align="left">0.782</td>
<td valign="middle" align="left">0.693</td>
<td valign="middle" align="left">0.833</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">ResNet- 50</td>
<td valign="middle" align="left">0.764</td>
<td valign="middle" align="left">0.693</td>
<td valign="middle" align="left">0.718</td>
<td valign="middle" align="left">0.794</td>
<td valign="middle" align="left">0.705</td>
<td valign="middle" align="left">0.837</td>
</tr>
<tr>
<td valign="middle" align="left">TCGA</td>
<td valign="middle" align="left">UNI-v2</td>
<td valign="middle" align="left">0.804</td>
<td valign="middle" align="left">0.565</td>
<td valign="middle" align="left">0.722</td>
<td valign="middle" align="left">0.829</td>
<td valign="middle" align="left">0.634</td>
<td valign="middle" align="left">0.850</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">CONCH</td>
<td valign="middle" align="left">0.765</td>
<td valign="middle" align="left">0.554</td>
<td valign="middle" align="left">0.622</td>
<td valign="middle" align="left">0.817</td>
<td valign="middle" align="left">0.586</td>
<td valign="middle" align="left">0.791</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">ResNet- 50</td>
<td valign="middle" align="left">0.775</td>
<td valign="middle" align="left">0.576</td>
<td valign="middle" align="left">0.639</td>
<td valign="middle" align="left">0.825</td>
<td valign="middle" align="left">0.606</td>
<td valign="middle" align="left">0.805</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Acc for accuracy, Pre for precision, Spe for Specificity, F1 Sco for F1 Score.</p></fn>
</table-wrap-foot>
</table-wrap>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>ROC curves and confusion matrices of different cohorts.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1775750-g003.tif">
<alt-text content-type="machine-generated">Two rows of data visualizations compare machine learning model performance. Each row contains one ROC curve plot on the left, showing three models’ curves and AUC values, followed by three confusion matrix heatmaps on the right for each model, labeled UNI, Conch, and ResNet50, presenting true and predicted labels in distinct color gradients for RHWU (top row) and TCGA (bottom row) datasets.</alt-text>
</graphic></fig>
</sec>
<sec id="s4_2">
<label>3.2</label>
<title>Interpretability analysis of attention mechanisms</title>
<p>To elucidate the histopathological features underlying model predictions, attention heatmaps were generated for each WSI (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref>). Based on the attention heatmaps, we retrospectively qualitatively analyzed the spatial distribution patterns of different cases. In patients with N-positive status, high-attention regions were concentrated at tumor&#x2013;stroma interfaces, particularly in areas exhibiting poorly differentiated tumor clusters, nuclear pleomorphism, and mitotic activity. Stromal zones enriched with spindle-shaped fibroblasts and scattered lymphocytes were also frequently highlighted. Conversely, in N0 cases, the model focused on well-formed glandular structures with preserved polarity and minimal stromal reaction. Pathologist review of the top-ranked tiles confirmed the biological plausibility of the model&#x2019;s focus, suggesting that the framework captured morphologic correlates of nodal metastasis. Representative WSIs with corresponding heatmaps demonstrated the ability of the model to localize regions of histological aggressiveness that may serve as surrogates for metastatic potential.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Representative whole slide images and attention heatmaps of N stage for prostate cancer patients. <bold>(A, B)</bold> N0 Patient, <bold>(C, D)</bold> N1 Patient <bold>(E, F)</bold> Patches of top 8 attention score.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1775750-g004.tif">
<alt-text content-type="machine-generated">Composite figure showing histopathological slides labeled A and C, corresponding heatmap analyses labeled B and D, and two grids of microscopic tile images labeled E and F, each selected using blue arrows for further examination.</alt-text>
</graphic></fig>
</sec>
<sec id="s4_3">
<label>3.3</label>
<title>Differential gene expression and functional enrichment</title>
<p>To explore molecular correlates of nodal status, transcriptomic data from the TCGA cohort were analyzed in an exploratory, hypothesis-generating manner. A total of 94 genes were differentially expressed between N-positive and N-negative patients, based on thresholds of |log2 fold change| &gt; 1 and adjusted p-value &lt; 0.05. Volcano plot visualization demonstrated a distinct separation of upregulated and downregulated transcripts (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5</bold></xref>).</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Volcano plot and KEGG enrichment analysis of DEGs.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1775750-g005.tif">
<alt-text content-type="machine-generated">Panel A shows a volcano plot indicating significantly upregulated genes in red and downregulated genes in blue between groups N1 and N0, with labeled genes and significance legend. Panel B presents a bubble plot of KEGG pathways enriched among downregulated genes, with pathways such as neuroactive ligand-receptor interaction and calcium signaling ranked by gene ratio, bubble size for gene count, and color gradient for adjusted p-values. Panel C displays a similar bubble plot for upregulated genes, highlighting pathways like cytokine-cytokine receptor interaction and cell cycle, using the same visual scheme as panel B.</alt-text>
</graphic></fig>
<p>KEGG pathway analysis corroborated these findings (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5</bold></xref>). Upregulated pathways in the N1 group included Cell cycle, Systemic lupus erythematosus, Cytokine&#x2013;cytokine receptor interaction, Neutrophil extracellular trap formation, and PI3K&#x2013;Akt signaling, highlighting the interplay between cell proliferation, immune modulation, and metastatic potential. Conversely, downregulated pathways were enriched in Neuroactive ligand&#x2013;receptor interaction, Calcium signaling, Adrenergic signaling in cardiomyocytes, and PPAR signaling, indicating suppression of neuroendocrine and metabolic functions in nodal disease.</p>
<p>Gene Ontology (GO) enrichment analysis revealed distinct functional patterns among upregulated and downregulated genes across the categories of molecular function (MF), biological process (BP), and cellular component (CC), as shown in <xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6</bold></xref>. In terms of MF, the upregulated genes were mainly enriched in antigen binding, microtubule binding and motor activity, cytoskeletal motor activity, and peptidase inhibitor or regulator activity, indicating enhanced functions related to cytoskeletal dynamics and immune responses. Conversely, the downregulated genes were predominantly enriched in gated and voltage-gated ion channel activity, neurotransmitter receptor activity, and fatty acid or glycosaminoglycan binding, suggesting reduced transmembrane signaling and metabolic regulation.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>GO enrichment analysis and GO network of DEGs. <bold>(A-C)</bold> BP, MF, and CC of up regulated Genes; <bold>(D-F)</bold> BP, MF, and CC of dowm regulated Genes. <bold>(G, H)</bold> GO Enrichment Network of DEGs.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1775750-g006.tif">
<alt-text content-type="machine-generated">Six bar charts labeled panels A to F show gene ontology enrichment analysis for upregulated and downregulated genes, divided by biological process, molecular function, and cellular component, with color bars indicating significance levels. Two network diagrams labeled panels G and H illustrate gene-pathway relationships for upregulated and downregulated genes, respectively, with edge connections and node size variation representing pathway involvement.</alt-text>
</graphic></fig>
<p>Regarding BP, the upregulated genes were significantly associated with regulation of membrane potential, muscle system processes and contraction, response and detoxification to metal ions (copper, zinc, cadmium), heart contraction and blood pressure regulation, and extracellular matrix organization. In contrast, the downregulated genes were also enriched in pathways related to membrane potential regulation, ion transport, muscle contraction, and neuronal activity, implying functional alterations in ion homeostasis and muscular signaling under the studied condition.</p>
<p>For CC, upregulated genes were primarily located in the immunoglobulin complex, chromosomal and spindle-associated structures (including centromeric regions, kinetochores, and microtubules), reflecting enhanced mitotic and immune-related activities. Downregulated genes, however, were mainly distributed in the sarcolemma, synaptic and postsynaptic membranes, sarcoplasmic reticulum, and ion channel complexes, highlighting suppression of ion transport and neuromuscular transmission.</p>
<p>Collectively, these findings indicate that upregulated genes are mainly involved in immune activation, chromatin organization, and cytoskeletal remodeling, whereas downregulated genes are primarily associated with ion channel regulation, neuronal signaling, and metabolic processes, suggesting complementary functional shifts in response to the biological context examined. These analyses were exploratory in nature and aimed at generating hypotheses regarding the molecular landscape associated with AI-predicted and pathologically confirmed nodal status.</p>
</sec>
<sec id="s4_4">
<label>3.4</label>
<title>Prognostic relevance of nodal-associated genes</title>
<p>To assess the clinical impact of nodal-associated molecular alterations, Kaplan&#x2013;Meier survival analyses were performed for selected DEGs with the strongest associations to nodal status (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7</bold></xref>). Several genes, including PEBP4, TMEM121B, FAM107A, PRSS27, SRD5A2, INSM2, AQP5, USP32P3, and LGI3 exhibited significant correlations with reduced overall survival (log-rank p &lt; 0.01). These findings suggest a potential link between AI-identified morphological correlates of N stage and transcriptomic alterations associated with unfavorable prognosis. Further studies adjusting for clinical covariates are needed to validate the independent prognostic value of these genes.</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Kaplan&#x2013;Meier survival curves of prostate N stage associated genes.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1775750-g007.tif">
<alt-text content-type="machine-generated">Set of nine Kaplan-Meier survival curves comparing high and low gene expression for PEBP4, TMEM121B, FAM107A, PRSS27, SRD5A2, INSM2, AQP5, USP32P3, and LGI3. Each graph shows overall survival over time in months, with distinct blue and red lines for high and low expression, respectively, p-values indicating statistical significance, and tables showing the number at risk below each plot.</alt-text>
</graphic></fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>In this study, we developed and validated a pathology foundation model&#x2013;based MIL framework for predicting nodal involvement in prostate cancer directly from hematoxylin and eosin (H&amp;E)-stained whole slide images. Using a multicenter design incorporating both RHWU and TCGA cohorts, the proposed approach achieved high diagnostic accuracy, robust external generalizability, and meaningful biological interpretability. Beyond predictive performance, we further explored the molecular correlates of nodal status through integrative transcriptomic analyses, revealing differential gene expression patterns, functional enrichment in proliferative and invasive pathways, and immune infiltration profiles consistent with an immunosuppressive tumor microenvironment. Together, these findings underscore the potential of computational pathology to bridge histological morphology and tumor biology, offering clinically relevant insights into metastatic dissemination in prostate cancer.</p>
<p>Recent advances in computational pathology have demonstrated the potential of deep learning models to extract clinically relevant information directly from digitized histopathology slides. Deep learning models can automatically extract multi-level features from WSIs, enabling tissue region recognition, segmentation, and classification, thereby enhancing the automation and objectivity of prostate cancer pathology. Common CNN architectures such as U-Net, ResNet, VGG, and DenseNet have been widely applied to gland segmentation, tumor detection, and Gleason grading, achieving diagnostic consistency comparable to or exceeding that of pathologists (<xref ref-type="bibr" rid="B18">18</xref>&#x2013;<xref ref-type="bibr" rid="B21">21</xref>). End-to-end deep learning approaches allow semantic segmentation and lesion classification directly from prostate histopathology images. U-Net and its variants perform well in gland and tumor segmentation, with Dice scores exceeding 0.90. Patch-based multi-layer CNNs can detect prostate cancer, assign Gleason grades, and assess perineural invasion, achieving AUC values up to 0.99. Moreover, weakly supervised and MIL methods effectively mitigate limited annotation issues, enabling high-performance tumor recognition using only slide-level labels (<xref ref-type="bibr" rid="B22">22</xref>&#x2013;<xref ref-type="bibr" rid="B25">25</xref>). Self-supervised pre-trained foundation models for pathology, such as UNI, CONCH, and Virchow, have emerged as a research focus. Trained on massive cross-organ and cross-staining WSI datasets, these models possess strong feature extraction and generalization capabilities, achieving high downstream task performance with minimal annotated data. They support not only tumor detection and grading but also pathology report generation, image-text matching, and zero-shot retrieval, representing a systematic and platform-level advancement of AI in pathology.</p>
<p>MIL frameworks, including attention-based, CLAM-based approaches, DSMIL (<xref ref-type="bibr" rid="B26">26</xref>), and Transformer-based (<xref ref-type="bibr" rid="B27">27</xref>), have been successfully applied to predict key clinical endpoints such as lymph node metastasis, Gleason grading, and biochemical recurrence in prostate cancer, often achieving performance comparable to or exceeding that of human experts (<xref ref-type="bibr" rid="B25">25</xref>, <xref ref-type="bibr" rid="B28">28</xref>, <xref ref-type="bibr" rid="B29">29</xref>). We deliberately selected CLAM for the present study for several methodological and practical reasons. First, CLAM explicitly models instance-level heterogeneity within WSIs, which is particularly suitable for histopathology tasks characterized by weak supervision. Second, compared with Transformer-based MIL approaches, CLAM offers a more favorable trade-off between modeling capacity and data requirements. Transformer-based MIL models typically require substantially larger training cohorts to avoid overfitting, whereas CLAM has been shown to perform reliably on datasets of moderate size. Third, CLAM provides interpretability advantages through its attention scores and instance-level sampling strategy, allowing visualization of regions contributing most strongly to slide-level predictions.</p>
<p>Our results highlight several key contributions. First, the incorporation of domain-adapted foundation models, particularly the UNI-v2 encoder, substantially improved predictive performance compared to conventional ImageNet-pretrained backbones. This finding is consistent with emerging evidence that large-scale self-supervised learning on histopathology datasets yields representations that better capture the nuanced morphology of tumor tissue. Second, the use of CLAM-based MIL provided a weakly supervised yet interpretable framework for slide-level prediction. Unlike traditional convolutional neural networks, which often require extensive region-level annotations, our approach leveraged only slide-level labels while retaining spatial interpretability via attention heatmaps. These heatmaps consistently identified regions enriched in histological hallmarks of metastatic propensity, including nuclear atypia, poorly differentiated tumor clusters, and tumor&#x2013;stromal interactions, which were corroborated by expert pathologists. Such interpretability is critical for clinical translation, as it allows pathologists to validate AI-driven predictions within established diagnostic paradigms.</p>
<p>The transcriptomic analyses, while exploratory, provided a valuable molecular context. Integrative bioinformatics analyses further contextualized the imaging-derived predictions. Differential expression analysis indicated that N-positive tumors exhibited transcriptomic alterations associated with metastatic potential. Specifically, several genes, including PEBP4, TMEM121B, FAM107A, PRSS27, SRD5A2, INSM2, AQP5, USP32P3, and LGI3, were significantly correlated with reduced overall survival (log-rank p &lt; 0.01), highlighting their potential roles in disease progression, but the prognostic implications of the identified genes require validation in independent cohorts with multivariable models that account for standard clinical and pathological risk factors. These findings suggest that AI-identified morphological features of N stage are reflected at the molecular level. In addition, enrichment analyses revealed perturbations in pathways related to cell cycle regulation and extracellular matrix remodeling, consistent with mechanisms promoting tumor invasion and lymphatic dissemination.</p>
<p>In current clinical practice, lymph node involvement is primarily assessed through pelvic lymph node dissection (PLND) and imaging modalities such as PSMA-PET. When compared with existing clinical modalities for N staging, including MRI and PSMA-PET, our framework demonstrates several advantages. Imaging-based assessments, although non-invasive, often suffer from limited sensitivity, especially in detecting micrometastatic nodal disease. Histopathology remains the gold standard, yet manual review is labor-intensive and subject to inter-observer variability. By leveraging digitized WSIs and AI-based analysis, our approach provides a scalable and reproducible alternative that complements conventional diagnostics. Moreover, unlike imaging modalities that require specialized equipment and tracers, computational pathology can be implemented on widely available digital slides, facilitating broader clinical adoption. Despite the model&#x2019;s high overall accuracy, false negatives could miss patients with lymph node involvement, while false positives might trigger unnecessary diagnostic procedures. Our model is best suited as a risk-stratification tool to identify low-risk patients, not as a definitive diagnostic, and that the operating threshold should be adjusted based on the clinical context&#x2014;prioritizing sensitivity when ruling out metastasis is critical.</p>
<p>Despite its strengths, this study has limitations that warrant consideration. First, the RHWU cohort, although carefully curated, remains of modest size relative to the heterogeneity of prostate cancer. Larger, multicenter cohorts will be needed to further validate generalizability across populations and institutions. Second, while our attention-based interpretability offers valuable spatial insights, functional validation of highlighted regions was not performed, leaving the causal link between histological features and metastatic behavior to be further explored. Third, class imbalance is an inherent challenge in MIL tasks. Imbalance occurs at multiple levels, including the bag (patient/WSI) level and the instance patch level, where only a small fraction of patches within positive slides are truly discriminative, and the spatial level, where large areas of background or non-neoplastic tissue coexist with relatively sparse tumor or invasive regions. The TCGA cohort showed a less favorable class distribution, though the model was trained primarily on the RHWU cohort, which exhibited a relatively balanced class distribution and included a sufficient number of cases to support robust model training and feature learning, and its performance remained stable during external validation, suggesting that the learned representations were not overly driven by class frequency bias. Fourth, the RHWU training cohort has a higher proportion of locally advanced cases compared with the TCGA cohort. While this cohort heterogeneity may reflect real-world clinical practice, differences in case composition, stage distribution, and surgical strategies between cohorts could influence the generalizability of our model. Fifth, although transcriptomic analyses provided biological context, additional multi-omic integration (including genomics, epigenomics, and proteomics) could yield a more comprehensive understanding of metastatic progression. Finally, prospective evaluation in real-world diagnostic workflows will be essential to assess clinical utility, pathologist acceptance, and cost-effectiveness.</p>
<p>Looking ahead, several directions may enhance the translational potential of our framework. Expanding the sample size through multi-center data collection and incorporating explicit imbalance-aware strategies, such as class-weighted loss functions within the MIL classification objective. Incorporating multi-modal data, such as radiomics, clinical variables, and genomic alterations, could improve predictive accuracy and enable more personalized risk stratification. Expanding the scope to predict other clinically relevant endpoints, including biochemical recurrence, distant metastasis, and treatment response, may further increase clinical value. Moreover, the development of user-friendly interfaces that visualize AI-generated risk maps alongside pathology slides will facilitate integration into routine diagnostic practice and foster collaborative human&#x2013;AI decision-making.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusion</title>
<p>We present a robust and interpretable artificial intelligence framework that integrates pathology foundation models with multi-instance learning to predict nodal involvement in prostate cancer. Leveraging large-scale histopathology datasets from RHWU and TCGA, our approach demonstrated strong predictive performance, external generalizability, and meaningful biological interpretability. Transcriptomic and bio information analyses further revealed molecular mechanisms underlying nodal metastasis, highlighting potential biomarkers and therapeutic targets. These findings support the clinical potential of computational pathology as a decision-support tool for precision oncology, offering a scalable, reproducible, and biologically informed approach to prostate cancer staging and management.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/supplementary material. Further inquiries can be directed to the corresponding author.</p></sec>
<sec id="s7" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving humans were approved by Renmin Hospital of Wuhan University Ethics Committee. The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p></sec>
<sec id="s8" sec-type="author-contributions">
<title>Author contributions</title>
<p>GZ: Validation, Conceptualization, Software, Supervision, Formal analysis, Data curation, Writing &#x2013; original draft, Methodology. WL: Formal analysis, Writing &#x2013; original draft, Project administration, Methodology, Data curation, Software, Validation, Supervision. HM: Formal analysis, Writing &#x2013; original draft, Software, Data curation, Resources, Methodology. RD: Methodology, Project administration, Conceptualization, Visualization, Validation, Funding acquisition, Resources, Investigation, Formal analysis, Writing &#x2013; review &amp; editing.</p></sec>
<sec id="s10" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s11" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s12" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sekhoacha</surname> <given-names>M</given-names></name>
<name><surname>Riet</surname> <given-names>K</given-names></name>
<name><surname>Motloung</surname> <given-names>P</given-names></name>
<name><surname>Gumenku</surname> <given-names>L</given-names></name>
<name><surname>Adegoke</surname> <given-names>A</given-names></name>
<name><surname>Mashele</surname> <given-names>S</given-names></name>
</person-group>. 
<article-title>Prostate cancer review: genetics, diagnosis, treatment options, and alternative approaches</article-title>. <source>Molecules</source>. (<year>2022</year>) <volume>27</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/molecules27175730</pub-id>, PMID: <pub-id pub-id-type="pmid">36080493</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<label>2</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Siegel</surname> <given-names>RL</given-names></name>
<name><surname>Kratzer</surname> <given-names>TB</given-names></name>
<name><surname>Giaquinto</surname> <given-names>AN</given-names></name>
<name><surname>Sung</surname> <given-names>H</given-names></name>
<name><surname>Jemal</surname> <given-names>A</given-names></name>
</person-group>. 
<article-title>Cancer statistics, 2025</article-title>. <source>CA: A Cancer J Clin</source>. (<year>2025</year>) <volume>75</volume>:<fpage>10</fpage>&#x2013;<lpage>45</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3322/caac.21871</pub-id>, PMID: <pub-id pub-id-type="pmid">39817679</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<label>3</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Nateghi</surname> <given-names>R</given-names></name>
<name><surname>Zhou</surname> <given-names>R</given-names></name>
<name><surname>Saft</surname> <given-names>M</given-names></name>
<name><surname>Schnauss</surname> <given-names>M</given-names></name>
<name><surname>Neill</surname> <given-names>C</given-names></name>
<name><surname>Alam</surname> <given-names>R</given-names></name>
<etal/>
</person-group>. 
<article-title>AI-driven screening of equivocal prostate IHC cases: development and validation of a screening and cancer detection framework</article-title>. <source>Mod Pathol</source>. (<year>2025</year>), <fpage>100904</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.modpat.2025.100904</pub-id>, PMID: <pub-id pub-id-type="pmid">41043642</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<label>4</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cornford</surname> <given-names>P</given-names></name>
<name><surname>van den Bergh</surname> <given-names>RCN</given-names></name>
<name><surname>Briers</surname> <given-names>E</given-names></name>
<name><surname>Van den Broeck</surname> <given-names>T</given-names></name>
<name><surname>Brunckhorst</surname> <given-names>O</given-names></name>
<name><surname>Darraugh</surname> <given-names>J</given-names></name>
<etal/>
</person-group>. 
<article-title>EAU-EANM-ESTRO-ESUR-ISUP-SIOG guidelines on prostate cancer-2024 update. Part I: screening, diagnosis, and local treatment with curative intent</article-title>. <source>Eur Urol</source>. (<year>2024</year>) <volume>86</volume>:<page-range>148&#x2013;63</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.eururo.2024.03.027</pub-id>, PMID: <pub-id pub-id-type="pmid">38614820</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<label>5</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Heidenreich</surname> <given-names>A</given-names></name>
<name><surname>Varga</surname> <given-names>Z</given-names></name>
<name><surname>Von Knobloch</surname> <given-names>R</given-names></name>
</person-group>. 
<article-title>Extended pelvic lymphadenectomy in patients undergoing radical prostatectomy: high incidence of lymph node metastasis</article-title>. <source>J Urol</source>. (<year>2002</year>) <volume>167</volume>:<page-range>1681&#x2013;6</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0022-5347(05)65177-4</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<label>6</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>D&#x2019;Rummo</surname> <given-names>KA</given-names></name>
<name><surname>Chen</surname> <given-names>RC</given-names></name>
<name><surname>Shen</surname> <given-names>X</given-names></name>
</person-group>. 
<article-title>Narrative review of management strategies and outcomes in node-positive prostate cancer</article-title>. <source>Transl Androl Urol</source>. (<year>2021</year>) <volume>10</volume>:<page-range>3176&#x2013;87</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.21037/tau-20-1031</pub-id>, PMID: <pub-id pub-id-type="pmid">34430420</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<label>7</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Daouacher</surname> <given-names>G</given-names></name>
<name><surname>Carlsson</surname> <given-names>J</given-names></name>
<name><surname>Voulgarakis</surname> <given-names>N</given-names></name>
<name><surname>Papageorgiou</surname> <given-names>S</given-names></name>
<name><surname>Dahlman</surname> <given-names>P</given-names></name>
<name><surname>Sundqvist</surname> <given-names>P</given-names></name>
<etal/>
</person-group>. 
<article-title>Diagnostic performance of conventional MRI using T1W and T2W for primary lymph node staging in intermediate- and high-risk prostate cancer patients prior to pelvic lymph node dissection</article-title>. <source>Abdom Radiol (NY)</source>. (<year>2025</year>) <volume>51</volume>(<issue>1</issue>):<fpage>206</fpage>&#x2013;<lpage>13</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00261-025-05073-w</pub-id>, PMID: <pub-id pub-id-type="pmid">40576663</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<label>8</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hope</surname> <given-names>TA</given-names></name>
<name><surname>Eiber</surname> <given-names>M</given-names></name>
<name><surname>Armstrong</surname> <given-names>WR</given-names></name>
<name><surname>Juarez</surname> <given-names>R</given-names></name>
<name><surname>Murthy</surname> <given-names>V</given-names></name>
<name><surname>Lawhn-Heath</surname> <given-names>C</given-names></name>
<etal/>
</person-group>. 
<article-title>Diagnostic accuracy of 68Ga-PSMA-11 PET for pelvic nodal metastasis detection prior to radical prostatectomy and pelvic lymph node dissection: A multicenter prospective phase 3 imaging trial</article-title>. <source>JAMA Oncol</source>. (<year>2021</year>) <volume>7</volume>:<page-range>1635&#x2013;42</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1001/jamaoncol.2021.3771</pub-id>, PMID: <pub-id pub-id-type="pmid">34529005</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<label>9</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Marra</surname> <given-names>G</given-names></name>
<name><surname>Valerio</surname> <given-names>M</given-names></name>
<name><surname>Heidegger</surname> <given-names>I</given-names></name>
<name><surname>Tsaur</surname> <given-names>I</given-names></name>
<name><surname>Mathieu</surname> <given-names>R</given-names></name>
<name><surname>Ceci</surname> <given-names>F</given-names></name>
<etal/>
</person-group>. 
<article-title>Management of patients with node-positive prostate cancer at radical prostatectomy and pelvic lymph node dissection: A systematic review</article-title>. <source>Eur Urol Oncol</source>. (<year>2020</year>) <volume>3</volume>:<page-range>565&#x2013;81</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.euo.2020.08.005</pub-id>, PMID: <pub-id pub-id-type="pmid">32933887</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<label>10</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yu</surname> <given-names>KH</given-names></name>
<name><surname>Healey</surname> <given-names>E</given-names></name>
<name><surname>Leong</surname> <given-names>TY</given-names></name>
<name><surname>Kohane</surname> <given-names>IS</given-names></name>
<name><surname>Manrai</surname> <given-names>AK</given-names></name>
</person-group>. 
<article-title>Medical artificial intelligence and human values</article-title>. <source>N Engl J Med</source>. (<year>2024</year>) <volume>390</volume>:<page-range>1895&#x2013;904</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1056/NEJMra2214183</pub-id>, PMID: <pub-id pub-id-type="pmid">38810186</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<label>11</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Gadermayr</surname> <given-names>M</given-names></name>
<name><surname>Tschuchnig</surname> <given-names>M</given-names></name>
</person-group>. 
<article-title>Multiple instance learning for digital pathology: A review of the state-of-the-art, limitations &amp; future potential</article-title>. <source>Computerized Med Imaging Graphics</source>. (<year>2024</year>) <volume>112</volume>:<fpage>102337</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compmedimag.2024.102337</pub-id>, PMID: <pub-id pub-id-type="pmid">38228020</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<label>12</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Quellec</surname> <given-names>G</given-names></name>
<name><surname>Cazuguel</surname> <given-names>G</given-names></name>
<name><surname>Cochener</surname> <given-names>B</given-names></name>
<name><surname>Lamard</surname> <given-names>M</given-names></name>
</person-group>. 
<article-title>Multiple-instance learning for medical image and video analysis</article-title>. <source>IEEE Rev BioMed Eng</source>. (<year>2017</year>) <volume>10</volume>:<page-range>213&#x2013;34</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/RBME.2017.2651164</pub-id>, PMID: <pub-id pub-id-type="pmid">28092576</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<label>13</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Moreno</surname> <given-names>CS</given-names></name>
<name><surname>Winham</surname> <given-names>CL</given-names></name>
<name><surname>Alemozaffar</surname> <given-names>M</given-names></name>
<name><surname>Klein</surname> <given-names>ER</given-names></name>
<name><surname>Lawal</surname> <given-names>IO</given-names></name>
<name><surname>Abiodun-Ojo</surname> <given-names>OA</given-names></name>
<etal/>
</person-group>. 
<article-title>Integrated genomic analysis of primary prostate tumor foci and corresponding lymph node metastases identifies mutations and pathways associated with metastasis</article-title>. <source>Cancers (Basel)</source>. (<year>2023</year>) <volume>15</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/cancers15235671</pub-id>, PMID: <pub-id pub-id-type="pmid">38067373</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<label>14</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chen</surname> <given-names>RJ</given-names></name>
<name><surname>Ding</surname> <given-names>T</given-names></name>
<name><surname>Lu</surname> <given-names>MY</given-names></name>
<name><surname>Williamson</surname> <given-names>DFK</given-names></name>
<name><surname>Jaume</surname> <given-names>G</given-names></name>
<name><surname>Song</surname> <given-names>AH</given-names></name>
<etal/>
</person-group>. 
<article-title>Towards a general-purpose foundation model for computational pathology</article-title>. <source>Nat Med</source>. (<year>2024</year>) <volume>30</volume>:<page-range>850&#x2013;62</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41591-024-02857-3</pub-id>, PMID: <pub-id pub-id-type="pmid">38504018</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<label>15</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lu</surname> <given-names>MY</given-names></name>
<name><surname>Chen</surname> <given-names>B</given-names></name>
<name><surname>Williamson</surname> <given-names>DFK</given-names></name>
<name><surname>Chen</surname> <given-names>RJ</given-names></name>
<name><surname>Liang</surname> <given-names>I</given-names></name>
<name><surname>Ding</surname> <given-names>T</given-names></name>
<etal/>
</person-group>. 
<article-title>A visual-language foundation model for computational pathology</article-title>. <source>Nat Med</source>. (<year>2024</year>) <volume>30</volume>:<page-range>863&#x2013;74</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41591-024-02856-4</pub-id>, PMID: <pub-id pub-id-type="pmid">38504017</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<label>16</label>
<mixed-citation publication-type="confproc">
<person-group person-group-type="author">
<name><surname>He</surname> <given-names>K</given-names></name>
<name><surname>Zhang</surname> <given-names>X</given-names></name>
<name><surname>Ren</surname> <given-names>S</given-names></name>
<name><surname>Sun</surname> <given-names>J</given-names></name>
</person-group>. (<year>2016</year>). 
<article-title>Deep residual learning for image recognition</article-title>, in: <conf-name>Proceedings of the IEEE conference on computer vision and pattern recognition</conf-name>, <publisher-loc>Las Vegas, NV, USA</publisher-loc>: 
<publisher-name>IEEE</publisher-name>. <fpage>770</fpage>&#x2013;<lpage>8</lpage>.
</mixed-citation>
</ref>
<ref id="B17">
<label>17</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lu</surname> <given-names>MY</given-names></name>
<name><surname>Williamson</surname> <given-names>DFK</given-names></name>
<name><surname>Chen</surname> <given-names>TY</given-names></name>
<name><surname>Chen</surname> <given-names>RJ</given-names></name>
<name><surname>Barbieri</surname> <given-names>M</given-names></name>
<name><surname>Mahmood</surname> <given-names>F</given-names></name>
</person-group>. 
<article-title>Data-efficient and weakly supervised computational pathology on whole-slide images</article-title>. <source>Nat BioMed Eng</source>. (<year>2021</year>) <volume>5</volume>:<page-range>555&#x2013;70</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41551-020-00682-w</pub-id>, PMID: <pub-id pub-id-type="pmid">33649564</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<label>18</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ren</surname> <given-names>J</given-names></name>
<name><surname>Sadimin</surname> <given-names>E</given-names></name>
<name><surname>Foran</surname> <given-names>DJ</given-names></name>
<name><surname>Qi</surname> <given-names>X</given-names></name>
</person-group>. 
<article-title>Computer aided analysis of prostate histopathology images to support a refined Gleason grading system</article-title>. <source>Proc SPIE Int Soc Opt Eng</source>. (<year>2017</year>) <volume>10133</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1117/12.2253887</pub-id>, PMID: <pub-id pub-id-type="pmid">30828124</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<label>19</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li</surname> <given-names>W</given-names></name>
<name><surname>Li</surname> <given-names>J</given-names></name>
<name><surname>Sarma</surname> <given-names>KV</given-names></name>
<name><surname>Ho</surname> <given-names>KC</given-names></name>
<name><surname>Shen</surname> <given-names>S</given-names></name>
<name><surname>Knudsen</surname> <given-names>BS</given-names></name>
<etal/>
</person-group>. 
<article-title>Path R-CNN for prostate cancer diagnosis and gleason grading of histological images</article-title>. <source>IEEE Trans Med Imaging</source>. (<year>2019</year>) <volume>38</volume>:<page-range>945&#x2013;54</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/TMI.2018.2875868</pub-id>, PMID: <pub-id pub-id-type="pmid">30334752</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<label>20</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Salvi</surname> <given-names>M</given-names></name>
<name><surname>Bosco</surname> <given-names>M</given-names></name>
<name><surname>Molinaro</surname> <given-names>L</given-names></name>
<name><surname>Gambella</surname> <given-names>A</given-names></name>
<name><surname>Papotti</surname> <given-names>M</given-names></name>
<name><surname>Acharya</surname> <given-names>UR</given-names></name>
<etal/>
</person-group>. 
<article-title>A hybrid deep learning approach for gland segmentation in prostate histopathological images</article-title>. <source>Artif Intell Med</source>. (<year>2021</year>) <volume>115</volume>:<fpage>102076</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.artmed.2021.102076</pub-id>, PMID: <pub-id pub-id-type="pmid">34001325</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<label>21</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Silva-Rodr&#xed;guez</surname> <given-names>J</given-names></name>
<name><surname>Colomer</surname> <given-names>A</given-names></name>
<name><surname>Naranjo</surname> <given-names>V</given-names></name>
</person-group>. 
<article-title>WeGleNet: A weakly-supervised convolutional neural network for the semantic segmentation of Gleason grades in prostate histology images</article-title>. <source>Comput Med Imaging Graph</source>. (<year>2021</year>) <volume>88</volume>:<fpage>101846</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compmedimag.2020.101846</pub-id>, PMID: <pub-id pub-id-type="pmid">33485056</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<label>22</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Pantanowitz</surname> <given-names>L</given-names></name>
<name><surname>Quiroga-Garza</surname> <given-names>GM</given-names></name>
<name><surname>Bien</surname> <given-names>L</given-names></name>
<name><surname>Heled</surname> <given-names>R</given-names></name>
<name><surname>Laifenfeld</surname> <given-names>D</given-names></name>
<name><surname>Linhart</surname> <given-names>C</given-names></name>
<etal/>
</person-group>. 
<article-title>An artificial intelligence algorithm for prostate cancer diagnosis in whole slide images of core needle biopsies: a blinded clinical validation and deployment study</article-title>. <source>Lancet Digit Health</source>. (<year>2020</year>) <volume>2</volume>:<page-range>e407&#x2013;e16</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S2589-7500(20)30159-X</pub-id>, PMID: <pub-id pub-id-type="pmid">33328045</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<label>23</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bulten</surname> <given-names>W</given-names></name>
<name><surname>Pinckaers</surname> <given-names>H</given-names></name>
<name><surname>van Boven</surname> <given-names>H</given-names></name>
<name><surname>Vink</surname> <given-names>R</given-names></name>
<name><surname>de Bel</surname> <given-names>T</given-names></name>
<name><surname>van Ginneken</surname> <given-names>B</given-names></name>
<etal/>
</person-group>. 
<article-title>Automated deep-learning system for Gleason grading of prostate cancer using biopsies: a diagnostic study</article-title>. <source>Lancet Oncol</source>. (<year>2020</year>) <volume>21</volume>:<page-range>233&#x2013;41</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S1470-2045(19)30739-9</pub-id>, PMID: <pub-id pub-id-type="pmid">31926805</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<label>24</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Str&#xf6;m</surname> <given-names>P</given-names></name>
<name><surname>Kartasalo</surname> <given-names>K</given-names></name>
<name><surname>Olsson</surname> <given-names>H</given-names></name>
<name><surname>Solorzano</surname> <given-names>L</given-names></name>
<name><surname>Delahunt</surname> <given-names>B</given-names></name>
<name><surname>Berney</surname> <given-names>DM</given-names></name>
<etal/>
</person-group>. 
<article-title>Artificial intelligence for diagnosis and grading of prostate cancer in biopsies: a population-based, diagnostic study</article-title>. <source>Lancet Oncol</source>. (<year>2020</year>) <volume>21</volume>:<page-range>222&#x2013;32</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S1470-2045(19)30738-7</pub-id>, PMID: <pub-id pub-id-type="pmid">31926806</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<label>25</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Campanella</surname> <given-names>G</given-names></name>
<name><surname>Hanna</surname> <given-names>MG</given-names></name>
<name><surname>Geneslaw</surname> <given-names>L</given-names></name>
<name><surname>Miraflor</surname> <given-names>A</given-names></name>
<name><surname>Werneck Krauss Silva</surname> <given-names>V</given-names></name>
<name><surname>Busam</surname> <given-names>KJ</given-names></name>
<etal/>
</person-group>. 
<article-title>Clinical-grade computational pathology using weakly supervised deep learning on whole slide images</article-title>. <source>Nat Med</source>. (<year>2019</year>) <volume>25</volume>:<page-range>1301&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41591-019-0508-1</pub-id>, PMID: <pub-id pub-id-type="pmid">31308507</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<label>26</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li</surname> <given-names>B</given-names></name>
<name><surname>Li</surname> <given-names>Y</given-names></name>
<name><surname>Eliceiri</surname> <given-names>KW</given-names></name>
</person-group>. 
<article-title>Dual-stream multiple instance learning network for whole slide image classification with self-supervised contrastive learning</article-title>. <source>Conf Comput Vis Pattern Recognit Workshops</source>. (<year>2021</year>) <volume>2021</volume>:<page-range>14318&#x2013;28</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/CVPR46437.2021.01409</pub-id>, PMID: <pub-id pub-id-type="pmid">35047230</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<label>27</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shao</surname> <given-names>Z</given-names></name>
<name><surname>Bian</surname> <given-names>H</given-names></name>
<name><surname>Chen</surname> <given-names>Y</given-names></name>
<name><surname>Wang</surname> <given-names>Y</given-names></name>
<name><surname>Zhang</surname> <given-names>J</given-names></name>
<name><surname>Ji</surname> <given-names>X</given-names></name>
</person-group>. 
<article-title>Transmil: Transformer based correlated multiple instance learning for whole slide image classification</article-title>. <source>Adv Neural Inf Process systems</source>. (<year>2021</year>) <volume>34</volume>:<page-range>2136&#x2013;47</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.48550/arxiv.2106.00908</pub-id>, PMID: <pub-id pub-id-type="pmid">41363103</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<label>28</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Xiang</surname> <given-names>J</given-names></name>
<name><surname>Wang</surname> <given-names>X</given-names></name>
<name><surname>Wang</surname> <given-names>X</given-names></name>
<name><surname>Zhang</surname> <given-names>J</given-names></name>
<name><surname>Yang</surname> <given-names>S</given-names></name>
<name><surname>Yang</surname> <given-names>W</given-names></name>
<etal/>
</person-group>. 
<article-title>Automatic diagnosis and grading of Prostate Cancer with weakly supervised learning on whole slide images</article-title>. <source>Comput Biol Med</source>. (<year>2023</year>) <volume>152</volume>:<fpage>106340</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compbiomed.2022.106340</pub-id>, PMID: <pub-id pub-id-type="pmid">36481762</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<label>29</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wessels</surname> <given-names>F</given-names></name>
<name><surname>Schmitt</surname> <given-names>M</given-names></name>
<name><surname>Krieghoff-Henning</surname> <given-names>E</given-names></name>
<name><surname>Jutzi</surname> <given-names>T</given-names></name>
<name><surname>Worst</surname> <given-names>TS</given-names></name>
<name><surname>Waldbillig</surname> <given-names>F</given-names></name>
<etal/>
</person-group>. 
<article-title>Deep learning approach to predict lymph node metastasis directly from primary tumour histology in prostate cancer</article-title>. <source>BJU Int</source>. (<year>2021</year>) <volume>128</volume>:<page-range>352&#x2013;60</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/bju.15386</pub-id>, PMID: <pub-id pub-id-type="pmid">33706408</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/760431">Alexander Winter</ext-link>, Hospital Oldenburg, Germany</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2940818">Francesco Prata</ext-link>, Campus Bio-Medico University Hospital, Italy</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3153785">Gamze Korkmaz Erdem</ext-link>, Kocaeli Universitesi Muhendislik Fakultesi, T&#xfc;rkiye</p></fn>
</fn-group>
<fn-group>
<fn fn-type="abbr" id="abbrev1">
<label>Abbreviations:</label>
<p>Prostate cancer, PCa; nodal involvement, N stage; computed tomography, CT; magnetic resonance imaging, MRI; prostate-specific membrane antigen positron emission tomography, PSMA-PET; pelvic lymph node dissection, PLND; Artificial intelligence, AI; whole slide images, WSIs; Multiple-Instance Learning, MIL; The Cancer Genome Atlas, TCGA; differentially expressed genes, DEGs; prostate-specific antigen, PSA; Clustering-constrained Attention Multiple Instance Learning, CLAM; Gene Ontology, GO; Kyoto Encyclopedia of Genes and Genomes, KEGG; overall survival, OS; receiver operating characteristic, ROC; area under the curve, AUC.</p>
</fn>
</fn-group>
</back>
</article>