<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Oncol.</journal-id>
<journal-title>Frontiers in Oncology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Oncol.</abbrev-journal-title>
<issn pub-type="epub">2234-943X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fonc.2024.1488118</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Oncology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Personalized three-year survival prediction and prognosis forecast by interpretable machine learning for pancreatic cancer patients: a population-based study and an external validation</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Teng</surname>
<given-names>Buwei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Xiaofeng</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ge</surname>
<given-names>Mingshu</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Miao</surname>
<given-names>Miao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Li</surname>
<given-names>Wei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Ma</surname>
<given-names>Jun</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2829398"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Hepatobiliary Surgery, The Affiliated Lianyungang Hospital of Xuzhou Medical University/The First People&#x2019;s Hospital of Lianyungang</institution>, <addr-line>Lianyungang</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Imaging, The Affiliated Huai&#x2019;an Hospital of Xuzhou Medical University and the Second People&#x2019;s Hospital of Huai&#x2019;an</institution>, <addr-line>Huai&#x2019;an</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Pengpeng Zhang, Nanjing Medical University, China</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Luo Qiang, Children&#x2019;s Hospital of Chongqing Medical University, China</p>
<p>Zhaokai Zhou, First Affiliated Hospital of Zhengzhou University, China</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Jun Ma, <email xlink:href="mailto:drmajun234@163.com">drmajun234@163.com</email>; Wei Li, <email xlink:href="mailto:power8446@163.com">power8446@163.com</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>21</day>
<month>10</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>14</volume>
<elocation-id>1488118</elocation-id>
<history>
<date date-type="received">
<day>29</day>
<month>08</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>19</day>
<month>09</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Teng, Zhang, Ge, Miao, Li and Ma</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Teng, Zhang, Ge, Miao, Li and Ma</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Purpose</title>
<p>The overall survival of patients with pancreatic cancer is extremely low. We aimed to establish a machine learning (ML)-based model to accurately predict the three-year survival and prognosis of pancreatic cancer patients.</p>
</sec>
<sec>
<title>Methods</title>
<p>We analyzed pancreatic cancer patients from the Surveillance, Epidemiology, and End Results (SEER) database between 2000 and 2021. Univariate and multivariate logistic analyses were employed to select variables. The Recursive Feature Elimination (RFE) method based on 6 ML algorithms was utilized in feature selection. To construct the predictive model, 13 ML algorithms were evaluated by area under the curve (AUC), area under precision-recall curve (PRAUC), accuracy, sensitivity, specificity, precision, cross-entropy, Brier score, Balanced Accuracy (bacc) and F Beta Score (fbeta). An optimal ML model was constructed to predict three-year survival, and the predictive results were explained by the SHapley Additive exPlanations (SHAP) framework. Meanwhile, 101 ML algorithm combinations were developed to select the best model with the highest C-index to predict the prognosis of pancreatic cancer patients.</p>
</sec>
<sec>
<title>Results</title>
<p>A total of 20,064 pancreatic cancer patients from the SEER database were consecutively enrolled. We utilized eight clinical variables to establish the prediction model for three-year survival. The CatBoost model was selected as the best prediction model, and AUC was 0.932 [0.924, 0.939], 0.899 [0.873, 0.934] and 0.826 [0.735, 0.919] in training, internal test and external test sets, with 0.839 [0.831, 0.847] accuracy, 0.872 [0.858, 0.887] sensitivity, 0.803 [0.784, 0.825] specificity and 0.832 [0.821, 0.853] precision. Surgery type had the greatest effects on three-year survival according to SHAP results. For prognosis prediction, the &#x201c;RSF+GBM&#x201d; algorithm was the best prognostic model with C-index of 0.774, 0.722 and 0.674 in training, internal test and external test sets.</p>
</sec>
<sec>
<title>Conclusions</title>
<p>Our ML models demonstrate excellent accuracy and reliability, offering more precise personalized prognostic prediction to pancreatic cancer patients.</p>
</sec>
</abstract>
<kwd-group>
<kwd>machine learning</kwd>
<kwd>pancreatic cancer</kwd>
<kwd>three-year survival</kwd>
<kwd>prognosis prediction</kwd>
<kwd>SEER</kwd>
</kwd-group>
<counts>
<fig-count count="7"/>
<table-count count="3"/>
<equation-count count="0"/>
<ref-count count="36"/>
<page-count count="22"/>
<word-count count="9372"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Cancer Immunity and Immunotherapy</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>Pancreatic cancer is a highly lethal disease with a dismal prognosis, and the 5-year survival rate is merely 9% (<xref ref-type="bibr" rid="B1">1</xref>). Only 1% of patients survive for 3 years or more after diagnosis of metastatic pancreatic cancer, while the incidence continues to climb steadily. Surgical resection is the only potential curative treatment, yet only a small proportion of pancreatic cancer patients are eligible for surgery at the time of initial diagnosis (<xref ref-type="bibr" rid="B2">2</xref>). This is largely because pancreatic cancer often lacks symptoms in its early stages, leading to most cases being diagnosed at an advanced stage (<xref ref-type="bibr" rid="B3">3</xref>). While some individuals may detect the disease through routine physical examinations and undergo early surgery, many patients still experience relapse and ultimately succumb to the disease (<xref ref-type="bibr" rid="B4">4</xref>). The treatment of pancreatic cancer mainly includes surgical resection, radiotherapy, chemotherapy and targeted therapy, but the overall efficacy is limited due to its high aggressiveness and the norm of late detection. Novel drugs targeting the KRAS gene, such as sotorasib and adagrasib, have demonstrated efficacy and tolerability in treating solid tumors, including pancreatic cancer, in clinical trials (<xref ref-type="bibr" rid="B5">5</xref>). Consequently, it is critical to promptly and early identify pancreatic cancer patients at high risk to optimize their treatment and improve prognosis. And exploring the prognostic risk factors for pancreatic cancer patients is crucial to assess their survival prospects.</p>
<p>Several biomarkers for prognosis prediction in pancreatic cancer have been identified in recent years, including CA19-9, circulating tumor DNA (ctDNA), microRNAs (miRNAs), and tumor mutational burden (TMB) (<xref ref-type="bibr" rid="B6">6</xref>). However, CA19-9 is not specific to pancreatic cancer and can be elevated in other conditions such as cholangitis, leading to false positives. Meanwhile, ctDNA analysis is limited by the low abundance of tumor DNA in the bloodstream, particularly in early-stage cancers, which may result in false negatives. In addition, the clinical application of miRNAs is still in the early stages, and their stability in circulation poses challenges for reliable detection (<xref ref-type="bibr" rid="B7">7</xref>). Furthermore, TMB&#x2019;s predictive value is still under investigation, and its utility may vary depending on the genetic landscape of the tumor and the therapeutic context (<xref ref-type="bibr" rid="B8">8</xref>). Recently, nomograms based on the Cox model have been widely utilized in cancer prognosis prediction, but their sensitivity and specificity may be insufficient, creating an urgent need for more accurate and specific prognosis prediction. The machine learning (ML) approach, a subset of artificial intelligence, has become increasingly popular due to its ability to handle complex, non-linear relationships, and it is particularly effective with vast datasets and loosely structured information (<xref ref-type="bibr" rid="B9">9</xref>). With the advent of big data analytics and ML, new approaches for screening risk factors affecting prognosis have become feasible. 
Several predictive models leveraging these technologies have shown excellent performance and are increasingly being integrated into clinical settings (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B11">11</xref>), while there is no ML-based sophisticated model to predict prognosis in pancreatic cancer so far, necessitating development and validation of a novel ML model.</p>
<p>The Surveillance, Epidemiology, and End Results (SEER) database (<ext-link ext-link-type="uri" xlink:href="https://seer.cancer.gov/">https://seer.cancer.gov/</ext-link>) is particularly valuable in this context, which encompasses a wide range of patient data, offering comprehensive clinicopathological statistics and follow-up information. This rich, real-world database is an ideal resource for developing and testing ML models in the medical field. However, it appears that there is still a gap in research specifically focused on developing models for three-year survival prediction and prognosis forecast of pancreatic cancer patients. Our study was committed to firstly developing and validating predictive and prognostic models utilizing multiple ML algorithms. This approach leverages extensive population data and the capabilities of ML, which is competent in providing personalized predictive tools that assist clinicians in effectively assessing the risk and prognosis of pancreatic cancer patients.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<title>Materials and methods</title>
<sec id="s2_1">
<title>Data source and characteristics</title>
<p>Clinicopathological data of patients with site recode ICD-O-3/WHO 2008 &#x201c;pancreas&#x201d; and AYA site recode 2020 Revision &#x201c;9.3.9.2 Pancreas &#x2013; adenocarcinoma&#x201d; between 2000 and 2021 was retrieved from the SEER database. Additionally, clinicopathological information of pancreatic cancer patients from The First People&#x2019;s Hospital of Lianyungang (2015&#x2013;2024) was retrospectively collected through the electronic medical record system. The study was conducted according to the guidelines of the Declaration of Helsinki and was approved by the Ethics Committee of The First People&#x2019;s Hospital of Lianyungang (protocol code: KY-20210910004, approved on 2021-09-10). Informed consent was obtained from all subjects involved in this study. Inclusion criteria comprised individuals with ICD-O-3/WHO 2008 &#x201c;pancreas&#x201d; and AYA site recode 2020 Revision &#x201c;9.3.9.2 Pancreas &#x2013; adenocarcinoma&#x201d; who were older than 18 years. Exclusion criteria comprised patients lacking follow-up information of survival months and death cause, not diagnosed with positive histology, no surgery information, not first malignant tumor, without TNM stage or grade details. In SEER database, metastasis is characterized by spreading to distant organs during the initial cancer diagnosis. And we define the outcome of predictive model as three-year survival, indicating that patients are still alive at the timepoint of 36 months follow-up. The positive outcome was death of patient in three-year follow-up.</p>
<p>Extracted data were gathered on demographic data (age, gender, race, marital status, household location and income), cancer characteristics (pathological grade, summary stage, TNM stage, tumor size, tumor primary location, pathology, metastasis information), therapeutic information (surgery, lymph node surgery, positive lymph node, radiotherapy, chemotherapy) and follow-up information (overall and cancer-specific survival status, survival months). Two continuous variables, age and tumor size, were divided into categorical variables. The age was split into five groups: &#x201c;&lt;50&#x201d;, &#x201c;50-59&#x201d;, &#x201c;60-69&#x201d;, &#x201c;70-79&#x201d; and &#x201c;&gt;=80&#x201d;. The tumor size was split into &#x201c;&lt;2cm&#x201d;, &#x201c;2-3.9cm&#x201d;, &#x201c;4-5.9cm&#x201d;, &#x201c;6-7.9cm&#x201d;, &#x201c;&gt;8cm&#x201d; and &#x201c;Unknown&#x201d;. &#x201c;Metastasis&#x201d; was defined as &#x201c;yes&#x201d; for patients with metastasis in the brain, bone, liver, lung or distant lymph nodes, or with a tumor categorized as M1 stage. The missing rate for each categorical variable was calculated and reported. For categorical data with unknown values, we classified the missing values into the &#x201c;unknown&#x201d; category. This processing ensures data integrity and avoids information loss due to missing data. We determined the minimum sample size needed for an external validation cohort by the formula of Riley et&#xa0;al. (<xref ref-type="bibr" rid="B12">12</xref>).</p>
</sec>
<sec id="s2_2">
<title>Establishment and validation of predictive model for three-year survival</title>
<p>In the preliminary analysis, variables with P &lt; 0.05 in the univariate and multivariate logistic analysis in the training set were included for the feature selection process. Subsequently, we employed Recursive Feature Elimination (RFE) method based on 6 ML algorithms, involving categorical boosting (CatBoost), random forest (RF), support vector machine (SVM), extreme gradient boosting (XGB), decision tree (DT) and gradient boosting machine (GBM), combined with 5-fold cross-validation, to sift through the clinical features. RFE works by building a model and identifying the most significant features in feature selection phase. This selection process is then iteratively repeated on the subset of remaining features until all features have been evaluated and ranked (<xref ref-type="bibr" rid="B13">13</xref>). Then Robust rank aggregation (RRA) algorithm was utilized to integrate the rank of variable importance from six ML algorithms utilized in RFE method to obtain a comprehensive ranking of all variables (<xref ref-type="bibr" rid="B14">14</xref>). We set random seed as &#x201c;2024&#x201d; in our analysis. In model development phase, we applied 13 ML algorithms, including CatBoost, RF, SVM, XGB, DT, GBM, k-nearest neighbor (KNN), logistic regression (LR), naive bayes classifier (NBC), linear discriminant analysis (LDA), quadratic discriminant analysis (QDA), neural network (NNET) and generalized linear model (GLM) to predict three-year survival via &#x201c;mlr3&#x201d; R package (<xref ref-type="bibr" rid="B15">15</xref>). This approach allows us to compare the performance of various models and select the best predictive model. To tackle the issue of class imbalance, which could significantly skew performance metrics, we implemented the Synthetic Minority Over-sampling Technique (SMOTE) for training our model (<xref ref-type="bibr" rid="B16">16</xref>). 
We further refined our approach by employing nested resampling, which involved a two-tiered k-fold cross-validation process: one for optimizing model hyperparameters and another nested within it for model selection. Meanwhile, we utilized a 1000-evaluation random search across a 5-fold cross-validation framework, repeated five times for each model. Subsequently, area under the curve (AUC), area under precision-recall curve (PRAUC), accuracy, sensitivity, specificity, precision, cross-entropy, Brier scores and Balanced Accuracy (bacc) and F Beta Score (fbeta) were calculated to select the best ML model. Internal validation was carried out through 5-fold cross-validation. Precision-recall curve (PRC) was employed to evaluate the performance of classification models in handling imbalanced datasets. Calibration curve was utilized to appraise model&#x2019;s discriminative ability, and decision curve analysis (DCA) was applied to verify the clinical benefit of ML model via &#x201c;runway&#x201d; R package (<ext-link ext-link-type="uri" xlink:href="https://github.com/ML4LHS/runway/">https://github.com/ML4LHS/runway/</ext-link>). We set the selection criteria of our best model: highest AUC, highest PRAUC, and lowest Brier score, while also ensuring a good calibration curve, as well as outperforming balanced accuracy and F Beta Score. To quantify the impact of each variable, we calculated its mean contribution to the AUC as a percentage relative to the full model via &#x201c;DALEX&#x201d; R package (<xref ref-type="bibr" rid="B17">17</xref>). SHapley Additive exPlanations (SHAP) values were used to explain the best model predictions and to interpret the black-box ML model via &#x201c;shapviz&#x201d; R package (<ext-link ext-link-type="uri" xlink:href="https://github.com/ModelOriented/shapviz">https://github.com/ModelOriented/shapviz</ext-link>) (<xref ref-type="bibr" rid="B18">18</xref>).</p>
</sec>
<sec id="s2_3">
<title>Prognostic model based on integrative machine learning algorithms</title>
<p>Univariate and multivariate Cox analyses were employed to define clinical variables with significant prognostic value in overall survival (OS). We integrated 10 ML algorithms involving random survival forest (RSF), elastic network (Enet), Lasso, Ridge, stepwise Cox, CoxBoost, partial least squares regression for Cox (plsRcox), supervised principal components (SuperPC), GBM and survival support vector machine (survival-SVM) to predict prognosis (in terms of OS) of pancreatic cancer patients. Altogether 101 prognostic ML algorithm combinations were trained in the training cohort, to develop the prognostic ML model according to the leave-one-out cross-validation (LOOCV) framework. Models with &lt;3 clinical variables were removed. Subsequently, the concordance index (C-index) of every ML combination in training, testing and external validation cohorts was obtained (<xref ref-type="bibr" rid="B19">19</xref>). The top five ML combinations yielding the highest average C-index across three cohorts were selected for model evaluation via k-fold cross-validation, to mitigate overfitting and ensure the robustness and generalizability of the model. Logarithmic loss, recall and decision calibration were utilized to select the best prognostic ML combination via &#x201c;mlr3proba&#x201d; R package (<xref ref-type="bibr" rid="B20">20</xref>). We incorporated variables from various feature selection patterns to compute risk scores using a linear combination function for each prognostic ML combination. The median risk score from the training cohort was chosen as the threshold to categorize patients in training, testing and external validation cohorts into high or low-risk groups. We utilized the Kaplan-Meier (KM) survival analysis and the log-rank test on these groups, using the &#x201c;survival&#x201d; and &#x201c;survminer&#x201d; R packages. 
AUC, time-dependent receiver operating characteristic (ROC) curves, calibration curves and DCA were employed to evaluate the precision, discrimination and clinical benefit of the model.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Results</title>
<sec id="s3_1">
<title>Demographic composition and clinical baseline information</title>
<p>In the predictive model for three-year survival, a total of 20064 pancreatic cancer patients from SEER database and 103 patients from The First People&#x2019;s Hospital of Lianyungang were included. We divided patients from SEER database randomly into training and internal validation sets in a 7:3 ratio, respectively. And pancreatic cancer patients from The First People&#x2019;s Hospital of Lianyungang were assigned as the external validation set. In the training set from SEER database, 2579 cases (18.3%) were alive at three-year follow-up, while 11548 cases (81.7%) were not. Detailed clinical information regarding the training and validation sets to predict three-year survival can be found in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>. For the outcomes (in terms of OS) of prognostic model, 13157 cases (93.1%) were dead at the time of follow-up, while 970 cases (6.87%) were alive (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). In the training, internal validation and external validation sets, the median follow-up time was 12.0 [5.00;26.0], 12.0 [5.00;27.0] and 16.0 [6.00;30.5] months, respectively (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). The specific selection process of patients from SEER database is shown in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Clinicopathological characteristics of patients with pancreatic cancer in the training, internal validation and external validation cohorts.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center"/>
<th valign="top" align="center">Training Cohort N=14127</th>
<th valign="top" align="center">Validation Cohort N=5937</th>
<th valign="top" align="center">External Validation Cohort N=103</th>
<th valign="top" align="center">p.overall</th>
</tr>
</thead>
<tbody>
<tr>
<th valign="top" align="left">Sex</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.997</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Male</td>
<td valign="top" align="center"/>
<td valign="bottom" align="center"/>
<td valign="bottom" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Female</td>
<td valign="top" align="center">7162 (50.7%)</td>
<td valign="top" align="center">3013 (50.7%)</td>
<td valign="top" align="center">52 (50.5%)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<th valign="top" align="left">Age</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.046</th>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;&lt;50</td>
<td valign="bottom" align="center">1048 (7.42%)</td>
<td valign="bottom" align="center">419 (7.06%)</td>
<td valign="bottom" align="center">11 (10.7%)</td>
<td valign="bottom" align="center"/>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;50-59</td>
<td valign="bottom" align="center">2928 (20.7%)</td>
<td valign="bottom" align="center">1223 (20.6%)</td>
<td valign="bottom" align="center">21 (20.4%)</td>
<td valign="bottom" align="center"/>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;60-69</td>
<td valign="bottom" align="center">4567 (32.3%)</td>
<td valign="bottom" align="center">1963 (33.1%)</td>
<td valign="bottom" align="center">17 (16.5%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;70-79</td>
<td valign="bottom" align="center">3936 (27.9%)</td>
<td valign="bottom" align="center">1654 (27.9%)</td>
<td valign="bottom" align="center">38 (36.9%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;&gt;=80</td>
<td valign="bottom" align="center">1648 (11.7%)</td>
<td valign="bottom" align="center">678 (11.4%)</td>
<td valign="bottom" align="center">16 (15.5%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Race</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">&lt;0.001</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;White</td>
<td valign="bottom" align="center">11343 (80.3%)</td>
<td valign="bottom" align="center">4772 (80.4%)</td>
<td valign="bottom" align="center">0 (0.00%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Black</td>
<td valign="bottom" align="center">1558 (11.0%)</td>
<td valign="bottom" align="center">641 (10.8%)</td>
<td valign="bottom" align="center">0 (0.00%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Other</td>
<td valign="bottom" align="center">1226 (8.68%)</td>
<td valign="bottom" align="center">524 (8.83%)</td>
<td valign="bottom" align="center">103 (100%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Marital_Status</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.378</th>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Married</td>
<td valign="bottom" align="center">8571 (60.7%)</td>
<td valign="bottom" align="center">3614 (60.9%)</td>
<td valign="bottom" align="center">69 (67.0%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Unmarried</td>
<td valign="bottom" align="center">1782 (12.6%)</td>
<td valign="bottom" align="center">720 (12.1%)</td>
<td valign="bottom" align="center">14 (13.6%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Widowed or divorced</td>
<td valign="bottom" align="center">3365 (23.8%)</td>
<td valign="bottom" align="center">1418 (23.9%)</td>
<td valign="bottom" align="center">20 (19.4%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Unknown</td>
<td valign="bottom" align="center">409 (2.90%)</td>
<td valign="bottom" align="center">185 (3.12%)</td>
<td valign="bottom" align="center">0 (0.00%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Year_of_Diagnosis</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">&lt;0.001</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;2000-2010</td>
<td valign="bottom" align="center">7649 (54.1%)</td>
<td valign="bottom" align="center">3221 (54.3%)</td>
<td valign="bottom" align="center">78 (75.7%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;2011-2020</td>
<td valign="bottom" align="center">6478 (45.9%)</td>
<td valign="bottom" align="center">2716 (45.7%)</td>
<td valign="bottom" align="center">25 (24.3%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Household_Location</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.684</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Rural</td>
<td valign="bottom" align="center">1587 (11.2%)</td>
<td valign="bottom" align="center">656 (11.0%)</td>
<td valign="bottom" align="center">9 (8.74%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Urban</td>
<td valign="bottom" align="center">12540 (88.8%)</td>
<td valign="bottom" align="center">5281 (89.0%)</td>
<td valign="bottom" align="center">94 (91.3%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Household_Income</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">&lt;0.001</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&lt;$70,000</td>
<td valign="bottom" align="center">4765 (33.7%)</td>
<td valign="bottom" align="center">1974 (33.2%)</td>
<td valign="bottom" align="center">9 (8.74%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&gt;=$70,000</td>
<td valign="bottom" align="center">9362 (66.3%)</td>
<td valign="bottom" align="center">3963 (66.8%)</td>
<td valign="bottom" align="center">94 (91.3%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Tumor_Primary_Site</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.519</th>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Pancreas Head</td>
<td valign="bottom" align="center">9330 (66.0%)</td>
<td valign="bottom" align="center">3924 (66.1%)</td>
<td valign="bottom" align="center">63 (61.2%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Pancreas Body or Tail</td>
<td valign="bottom" align="center">2910 (20.6%)</td>
<td valign="bottom" align="center">1259 (21.2%)</td>
<td valign="bottom" align="center">24 (23.3%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Other</td>
<td valign="bottom" align="center">1887 (13.4%)</td>
<td valign="bottom" align="center">754 (12.7%)</td>
<td valign="bottom" align="center">16 (15.5%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Histology</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.633</th>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Adenomas and adenocarcinomas</td>
<td valign="bottom" align="center">9285 (65.7%)</td>
<td valign="bottom" align="center">3940 (66.4%)</td>
<td valign="bottom" align="center">73 (70.9%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Ductal and lobular neoplasms</td>
<td valign="bottom" align="center">3769 (26.7%)</td>
<td valign="bottom" align="center">1586 (26.7%)</td>
<td valign="bottom" align="center">23 (22.3%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Cystic, mucinous and serous neoplasms</td>
<td valign="bottom" align="center">854 (6.05%)</td>
<td valign="bottom" align="center">329 (5.54%)</td>
<td valign="bottom" align="center">6 (5.83%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Other</td>
<td valign="bottom" align="center">219 (1.55%)</td>
<td valign="bottom" align="center">82 (1.38%)</td>
<td valign="bottom" align="center">1 (0.97%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Grade</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.629</th>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Well differentiated I</td>
<td valign="bottom" align="center">1673 (11.8%)</td>
<td valign="bottom" align="center">709 (11.9%)</td>
<td valign="bottom" align="center">13 (12.6%)</td>
<td valign="bottom" align="center"/>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Moderately differentiated II</td>
<td valign="bottom" align="center">6606 (46.8%)</td>
<td valign="bottom" align="center">2783 (46.9%)</td>
<td valign="bottom" align="center">48 (46.6%)</td>
<td valign="bottom" align="center"/>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Poorly differentiated III</td>
<td valign="bottom" align="center">5645 (40.0%)</td>
<td valign="bottom" align="center">2376 (40.0%)</td>
<td valign="bottom" align="center">39 (37.9%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Undifferentiated anaplastic IV</td>
<td valign="bottom" align="center">203 (1.44%)</td>
<td valign="bottom" align="center">69 (1.16%)</td>
<td valign="bottom" align="center">3 (2.91%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Summary_Stage</th>
<th valign="top" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="top" align="center">0.186</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Localized</td>
<td valign="top" align="center">1341 (9.49%)</td>
<td valign="top" align="center">533 (8.98%)</td>
<td valign="top" align="center">16 (15.5%)</td>
<td valign="top" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Regional</td>
<td valign="top" align="center">8635 (61.1%)</td>
<td valign="top" align="center">3636 (61.2%)</td>
<td valign="top" align="center">57 (55.3%)</td>
<td valign="top" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Distant</td>
<td valign="top" align="center">4151 (29.4%)</td>
<td valign="top" align="center">1768 (29.8%)</td>
<td valign="top" align="center">30 (29.1%)</td>
<td valign="top" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">AJCC_Stage</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.360</th>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;I</td>
<td valign="bottom" align="center">1341 (9.49%)</td>
<td valign="bottom" align="center">533 (8.98%)</td>
<td valign="bottom" align="center">16 (15.5%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;II</td>
<td valign="bottom" align="center">8000 (56.6%)</td>
<td valign="bottom" align="center">3392 (57.1%)</td>
<td valign="bottom" align="center">54 (52.4%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;III</td>
<td valign="bottom" align="center">1448 (10.2%)</td>
<td valign="bottom" align="center">590 (9.94%)</td>
<td valign="bottom" align="center">10 (9.71%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;IV</td>
<td valign="bottom" align="center">3338 (23.6%)</td>
<td valign="bottom" align="center">1422 (24.0%)</td>
<td valign="bottom" align="center">23 (22.3%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">T_Stage</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.459</th>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;T1</td>
<td valign="bottom" align="center">633 (4.48%)</td>
<td valign="bottom" align="center">284 (4.78%)</td>
<td valign="bottom" align="center">7 (6.80%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;T2</td>
<td valign="bottom" align="center">2352 (16.6%)</td>
<td valign="bottom" align="center">964 (16.2%)</td>
<td valign="bottom" align="center">22 (21.4%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;T3</td>
<td valign="bottom" align="center">8764 (62.0%)</td>
<td valign="bottom" align="center">3718 (62.6%)</td>
<td valign="bottom" align="center">56 (54.4%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;T4</td>
<td valign="bottom" align="center">2378 (16.8%)</td>
<td valign="bottom" align="center">971 (16.4%)</td>
<td valign="bottom" align="center">18 (17.5%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">N_Stage</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.758</th>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;N0</td>
<td valign="bottom" align="center">6526 (46.2%)</td>
<td valign="bottom" align="center">2776 (46.8%)</td>
<td valign="bottom" align="center">47 (45.6%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;N1</td>
<td valign="bottom" align="center">7601 (53.8%)</td>
<td valign="bottom" align="center">3161 (53.2%)</td>
<td valign="bottom" align="center">56 (54.4%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">M_Stage</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.839</th>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;M0</td>
<td valign="bottom" align="center">10789 (76.4%)</td>
<td valign="bottom" align="center">4515 (76.0%)</td>
<td valign="bottom" align="center">80 (77.7%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;M1</td>
<td valign="bottom" align="center">3338 (23.6%)</td>
<td valign="bottom" align="center">1422 (24.0%)</td>
<td valign="bottom" align="center">23 (22.3%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Tumor_Size</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.297</th>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;&lt;2cm</td>
<td valign="bottom" align="center">1084 (7.67%)</td>
<td valign="bottom" align="center">472 (7.95%)</td>
<td valign="bottom" align="center">11 (10.7%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;2-3.9cm</td>
<td valign="bottom" align="center">6743 (47.7%)</td>
<td valign="bottom" align="center">2798 (47.1%)</td>
<td valign="bottom" align="center">47 (45.6%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;4-5.9cm</td>
<td valign="bottom" align="center">3896 (27.6%)</td>
<td valign="bottom" align="center">1657 (27.9%)</td>
<td valign="bottom" align="center">29 (28.2%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;6-7.9cm</td>
<td valign="bottom" align="center">1050 (7.43%)</td>
<td valign="bottom" align="center">427 (7.19%)</td>
<td valign="bottom" align="center">10 (9.71%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;&gt;8cm</td>
<td valign="bottom" align="center">470 (3.33%)</td>
<td valign="bottom" align="center">211 (3.55%)</td>
<td valign="bottom" align="center">6 (5.83%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Unknown</td>
<td valign="bottom" align="center">884 (6.26%)</td>
<td valign="bottom" align="center">372 (6.27%)</td>
<td valign="bottom" align="center">0 (0.00%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Surgery_Type</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.180</th>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;No Surgery</td>
<td valign="bottom" align="center">5646 (40.0%)</td>
<td valign="bottom" align="center">2408 (40.6%)</td>
<td valign="bottom" align="center">41 (39.8%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Local or partial pancreatectomy</td>
<td valign="bottom" align="center">6947 (49.2%)</td>
<td valign="bottom" align="center">2829 (47.7%)</td>
<td valign="bottom" align="center">48 (46.6%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Total pancreatectomy</td>
<td valign="bottom" align="center">1534 (10.9%)</td>
<td valign="bottom" align="center">700 (11.8%)</td>
<td valign="bottom" align="center">14 (13.6%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Lymph_Nodes_Surgery</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.743</th>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;No or biopsy only</td>
<td valign="bottom" align="center">5696 (40.3%)</td>
<td valign="bottom" align="center">2441 (41.1%)</td>
<td valign="bottom" align="center">42 (40.8%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;1-3 regional lymph nodes removed</td>
<td valign="bottom" align="center">787 (5.57%)</td>
<td valign="bottom" align="center">342 (5.76%)</td>
<td valign="bottom" align="center">7 (6.80%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;4 or more regional lymph nodes removed</td>
<td valign="bottom" align="center">7644 (54.1%)</td>
<td valign="bottom" align="center">3154 (53.1%)</td>
<td valign="bottom" align="center">54 (52.4%)</td>
<td valign="bottom" align="center"/>
</tr>
<tr>
<th valign="top" align="left">Regional_Lymph_Nodes</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.676</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;No nodes were examined</td>
<td valign="bottom" align="center">5302 (37.5%)</td>
<td valign="bottom" align="center">2277 (38.4%)</td>
<td valign="bottom" align="center">38 (36.9%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Negative</td>
<td valign="bottom" align="center">3059 (21.7%)</td>
<td valign="bottom" align="center">1267 (21.3%)</td>
<td valign="bottom" align="center">25 (24.3%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Positive</td>
<td valign="bottom" align="center">5729 (40.6%)</td>
<td valign="bottom" align="center">2384 (40.2%)</td>
<td valign="bottom" align="center">40 (38.8%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="bottom" align="center">37 (0.26%)</td>
<td valign="bottom" align="center">9 (0.15%)</td>
<td valign="bottom" align="center">0 (0.00%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Chemotherapy</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.911</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;None/Unknown</td>
<td valign="bottom" align="center">4666 (33.0%)</td>
<td valign="bottom" align="center">1945 (32.8%)</td>
<td valign="bottom" align="center">35 (34.0%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="bottom" align="center">9461 (67.0%)</td>
<td valign="bottom" align="center">3992 (67.2%)</td>
<td valign="bottom" align="center">68 (66.0%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Radiation</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.328</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;None/Unknown</td>
<td valign="bottom" align="center">9995 (70.8%)</td>
<td valign="bottom" align="center">4174 (70.3%)</td>
<td valign="bottom" align="center">79 (76.7%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="bottom" align="center">4132 (29.2%)</td>
<td valign="bottom" align="center">1763 (29.7%)</td>
<td valign="bottom" align="center">24 (23.3%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Metastasis</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.940</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;No</td>
<td valign="bottom" align="center">5859 (41.5%)</td>
<td valign="bottom" align="center">2465 (41.5%)</td>
<td valign="bottom" align="center">41 (39.8%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="bottom" align="center">8268 (58.5%)</td>
<td valign="bottom" align="center">3472 (58.5%)</td>
<td valign="bottom" align="center">62 (60.2%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Bone_Metastasis</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.804</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;No</td>
<td valign="bottom" align="center">7530 (53.3%)</td>
<td valign="bottom" align="center">3180 (53.6%)</td>
<td valign="bottom" align="center">54 (52.4%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="bottom" align="center">97 (0.69%)</td>
<td valign="bottom" align="center">47 (0.79%)</td>
<td valign="bottom" align="center">0 (0.00%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="bottom" align="center">6500 (46.0%)</td>
<td valign="bottom" align="center">2710 (45.6%)</td>
<td valign="bottom" align="center">49 (47.6%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Brain_Metastasis</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.485</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;No</td>
<td valign="bottom" align="center">7620 (53.9%)</td>
<td valign="bottom" align="center">3227 (54.4%)</td>
<td valign="bottom" align="center">54 (52.4%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="bottom" align="center">5 (0.04%)</td>
<td valign="bottom" align="center">0 (0.00%)</td>
<td valign="bottom" align="center">0 (0.00%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="bottom" align="center">6502 (46.0%)</td>
<td valign="bottom" align="center">2710 (45.6%)</td>
<td valign="bottom" align="center">49 (47.6%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Liver_Metastasis</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.492</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;No</td>
<td valign="bottom" align="center">6381 (45.2%)</td>
<td valign="bottom" align="center">2667 (44.9%)</td>
<td valign="bottom" align="center">48 (46.6%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="bottom" align="center">1264 (8.95%)</td>
<td valign="bottom" align="center">569 (9.58%)</td>
<td valign="bottom" align="center">6 (5.83%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="bottom" align="center">6482 (45.9%)</td>
<td valign="bottom" align="center">2701 (45.5%)</td>
<td valign="bottom" align="center">49 (47.6%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Lung_Metastasis</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.778</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;No</td>
<td valign="bottom" align="center">7288 (51.6%)</td>
<td valign="bottom" align="center">3073 (51.8%)</td>
<td valign="bottom" align="center">51 (49.5%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="bottom" align="center">329 (2.33%)</td>
<td valign="bottom" align="center">154 (2.59%)</td>
<td valign="bottom" align="center">3 (2.91%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="bottom" align="center">6510 (46.1%)</td>
<td valign="bottom" align="center">2710 (45.6%)</td>
<td valign="bottom" align="center">49 (47.6%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Survival_Months</th>
<th valign="bottom" align="center">12.0 [5.00;26.0]</th>
<th valign="bottom" align="center">12.0 [5.00;27.0]</th>
<th valign="bottom" align="center">16.0 [6.00;30.5]</th>
<th valign="bottom" align="center">0.605</th>
</tr>
<tr>
<th valign="top" align="left">Vital_Status</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.848</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Alive</td>
<td valign="bottom" align="center">970 (6.87%)</td>
<td valign="bottom" align="center">421 (7.09%)</td>
<td valign="bottom" align="center">7 (6.80%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Dead</td>
<td valign="bottom" align="center">13157 (93.1%)</td>
<td valign="bottom" align="center">5516 (92.9%)</td>
<td valign="bottom" align="center">96 (93.2%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Cancer_Specific_Death</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.440</th>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Not cancer specific death</td>
<td valign="bottom" align="center">1823 (12.9%)</td>
<td valign="bottom" align="center">799 (13.5%)</td>
<td valign="bottom" align="center">11 (10.7%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Dead due to bladder cancer</td>
<td valign="bottom" align="center">12304 (87.1%)</td>
<td valign="bottom" align="center">5138 (86.5%)</td>
<td valign="bottom" align="center">92 (89.3%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Other_Cause_Death</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.430</th>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Not other cause death</td>
<td valign="bottom" align="center">13274 (94.0%)</td>
<td valign="bottom" align="center">5559 (93.6%)</td>
<td valign="bottom" align="center">99 (96.1%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Dead due to other cause</td>
<td valign="bottom" align="center">853 (6.04%)</td>
<td valign="bottom" align="center">378 (6.37%)</td>
<td valign="bottom" align="center">4 (3.88%)</td>
<td valign="bottom" align="center">
</td>
</tr>
<tr>
<th valign="top" align="left">Three_Year_Survival</th>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center"/>
<th valign="bottom" align="center">0.911</th>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Alive</td>
<td valign="bottom" align="center">2579 (18.3%)</td>
<td valign="bottom" align="center">1097 (18.5%)</td>
<td valign="bottom" align="center">18 (17.5%)</td>
<td valign="bottom" align="center"/>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Dead</td>
<td valign="bottom" align="center">11548 (81.7%)</td>
<td valign="bottom" align="center">4840 (81.5%)</td>
<td valign="bottom" align="center">85 (82.5%)</td>
<td valign="bottom" align="center"/>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>The workflow diagram for study design and patient screening.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1488118-g001.tif"/>
</fig>
</sec>
<sec id="s3_2">
<title>Feature selection for the predictive model</title>
<p>We utilized the &#x201c;autoplot&#x201d; function in the &#x201c;mlr3&#x201d; R package to visualize the correlation coefficients of the baseline characteristics with three-year survival, which revealed that &#x201c;AJCC_Stage&#x201d; had the most significant correlation with three-year survival (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2A</bold>
</xref>). Based on our clinical experience, we selected 24 variables for the logistic regression analysis (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>), while the variable with a correlation coefficient &gt; 0.6 was removed. Subsequently, we performed univariate and multivariate logistic regression analyses in the training cohort to identify the variables effective in predicting three-year survival, which revealed that &#x201c;Age&#x201d; (OR 1.67 (1.35-2.06)), &#x201c;Marital_Status&#x201d; (OR 1.27 (1.14-1.42)), &#x201c;Household_Income&#x201d; (OR 0.75 (0.68-0.83)), &#x201c;Histology&#x201d; (OR 0.5 (0.43-0.59)), &#x201c;Grade&#x201d; (OR 2.4 (1.59-3.72)), &#x201c;Summary_Stage&#x201d; (OR 3.12 (2.27-4.31)), &#x201c;Tumor_Size&#x201d; (OR 2.63 (2.08-3.34)), &#x201c;AJCC_Stage&#x201d; (OR 1.59 (1.09-2.35)), &#x201c;Surgery_Type&#x201d; (OR 0.15 (0.11-0.2)), &#x201c;Radiotherapy&#x201d; (OR 0.79 (0.72-0.87)), &#x201c;Chemotherapy&#x201d; (OR 0.57 (0.52-0.64)), &#x201c;Lung_Metastasis&#x201d; (OR 0.2 (0.06-0.99)), and &#x201c;M_Stage&#x201d; (OR 1.26 (1.07-1.48)) were significant predictors of three-year survival (P &lt; 0.05, <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). The correlation analysis between the variables and three-year survival showed that &#x201c;AJCC_Stage&#x201d; was the most influential factor (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>). Due to the high correlation between &#x201c;AJCC_Stage&#x201d; and &#x201c;Summary_Stage&#x201d;, we retained only &#x201c;AJCC_Stage&#x201d; in the following analysis. Afterwards, we utilized the Recursive Feature Elimination (RFE) method based on six ML algorithms (GBM, SVM, RF, DT, XGB and CatBoost), combined with 5-fold cross-validation, to sift through the clinical features (<xref ref-type="fig" rid="f2">
<bold>Figures&#xa0;2C&#x2013;H</bold>
</xref>). Feature selection based on RFE found that the optimal selection was obtained with the GBM algorithm, which retained 12 variables and achieved the highest AUC (0.819, <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2C</bold>
</xref>). We utilized the RRA algorithm to obtain a comprehensive ranking of the clinical variables across the six ML algorithms, with &#x201c;AJCC_Stage&#x201d; considered the most important (<xref ref-type="supplementary-material" rid="ST1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>). Finally, we selected eight variables with frequencies greater than 4, which indicates that these variables were important in most of the ML selection processes, for the subsequent model development (<xref ref-type="supplementary-material" rid="ST1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>The process of feature selection. <bold>(A)</bold> The correlation coefficients of the baseline characteristics with three-year survival. <bold>(B)</bold> The heatmap of Spearman&#x2019;s correlation analysis of the clinical variables with three-year survival. The correlation index ranges from -1.0 to 1.0, with a brighter color indicating a stronger correlation. <bold>(C&#x2013;H)</bold> Feature selection process with the Recursive Feature Elimination (RFE) method based on six ML algorithms (GBM, SVM, RF, DT, XGB and CatBoost).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1488118-g002.tif"/>
</fig>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Univariate and multivariate logistic regression analysis of pancreatic cancer patients for 3-year survival in the training cohort.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">Variable</th>
<th valign="top" colspan="2" align="center">Univariate logistic analysis</th>
<th valign="top" colspan="2" align="center">Multivariate logistic analysis</th>
</tr>
<tr>
<th valign="top" align="left">term</th>
<th valign="top" align="center">OR (95%CI)</th>
<th valign="top" align="center">p.value</th>
<th valign="top" align="center">OR (95%CI)</th>
<th valign="top" align="center">p.value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Sex: Male</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">Female</td>
<td valign="middle" align="center">0.92 (0.85-1)</td>
<td valign="middle" align="center">0.064</td>
<td valign="middle" align="center">\</td>
<td valign="middle" align="center">\</td>
</tr>
<tr>
<td valign="top" align="left">Age: &lt;50</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">50-59</td>
<td valign="middle" align="center">1.12 (0.95-1.33)</td>
<td valign="middle" align="center">0.185</td>
<td valign="middle" align="center">1.05 (0.89-1.24)</td>
<td valign="middle" align="center">0.568</td>
</tr>
<tr>
<td valign="top" align="left">60-69</td>
<td valign="middle" align="center">1.15 (0.98-1.35)</td>
<td valign="middle" align="center">0.089</td>
<td valign="middle" align="center">1.18 (1.01-1.39)</td>
<td valign="middle" align="center">0.04</td>
</tr>
<tr>
<td valign="top" align="left">70-79</td>
<td valign="middle" align="center">1.51 (1.28-1.79)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.41 (1.19-1.66)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&gt;=80</td>
<td valign="middle" align="center">2.46 (1.99-3.05)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.67 (1.35-2.06)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Race: White</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Black</td>
<td valign="middle" align="center">1.15 (1-1.33)</td>
<td valign="middle" align="center">0.047</td>
<td valign="middle" align="center">1.01 (0.88-1.16)</td>
<td valign="middle" align="center">0.898</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Other</td>
<td valign="middle" align="center">1.02 (0.87-1.19)</td>
<td valign="middle" align="center">0.841</td>
<td valign="middle" align="center">1.04 (0.9-1.2)</td>
<td valign="middle" align="center">0.604</td>
</tr>
<tr>
<td valign="top" align="left">Marital_Status: Married</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unmarried</td>
<td valign="middle" align="center">1.21 (1.06-1.38)</td>
<td valign="middle" align="center">0.006</td>
<td valign="middle" align="center">1.18 (1.03-1.34)</td>
<td valign="middle" align="center">0.015</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Widowed or divorced</td>
<td valign="middle" align="center">1.47 (1.32-1.64)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.27 (1.14-1.42)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="middle" align="center">1.21 (0.94-1.59)</td>
<td valign="middle" align="center">0.154</td>
<td valign="middle" align="center">1.3 (1.02-1.68)</td>
<td valign="middle" align="center">0.038</td>
</tr>
<tr>
<td valign="top" align="left">Household_Income: &lt;$70,000</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&gt;=$70,000</td>
<td valign="middle" align="center">0.81 (0.74-0.89)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.75 (0.68-0.83)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Household_Location: Rural</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Urban</td>
<td valign="middle" align="center">0.84 (0.73-0.96)</td>
<td valign="middle" align="center">0.014</td>
<td valign="middle" align="center">0.94 (0.81-1.08)</td>
<td valign="middle" align="center">0.386</td>
</tr>
<tr>
<td valign="top" align="left">Tumor_Primary_Site: Pancreas Head</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Pancreas Body or Tail</td>
<td valign="middle" align="center">1.27 (1.14-1.42)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.91 (0.79-1.05)</td>
<td valign="middle" align="center">0.191</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Other</td>
<td valign="middle" align="center">1.51 (1.31-1.73)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.05 (0.91-1.21)</td>
<td valign="middle" align="center">0.488</td>
</tr>
<tr>
<td valign="top" align="left">Histology: Adenomas and adenocarcinomas</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Ductal and lobular neoplasms</td>
<td valign="middle" align="center">0.55 (0.5-0.6)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.05 (0.96-1.15)</td>
<td valign="middle" align="center">0.3</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Cystic, mucinous and serous neoplasms</td>
<td valign="middle" align="center">0.41 (0.35-0.48)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.5 (0.43-0.59)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Other</td>
<td valign="middle" align="center">0.92 (0.64-1.34)</td>
<td valign="middle" align="center">0.642</td>
<td valign="middle" align="center">0.86 (0.62-1.2)</td>
<td valign="middle" align="center">0.359</td>
</tr>
<tr>
<td valign="top" align="left">Grade: Well differentiated I</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Moderately differentiated II</td>
<td valign="middle" align="center">1.56 (1.38-1.76)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.77 (1.57-2)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Poorly differentiated III</td>
<td valign="middle" align="center">3.12 (2.73-3.56)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">2.75 (2.41-3.14)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Undifferentiated anaplastic IV</td>
<td valign="middle" align="center">2.97 (1.97-4.68)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">2.4 (1.59-3.72)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Summary_Stage: Localized</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Regional</td>
<td valign="middle" align="center">2.55 (2.26-2.87)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.74 (1.31-2.3)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Distant</td>
<td valign="middle" align="center">15.52 (12.92-18.72)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">3.12 (2.27-4.31)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">AJCC_Stage: I</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;II</td>
<td valign="middle" align="center">2.34 (2.07-2.64)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.11 (0.89-1.39)</td>
<td valign="middle" align="center">0.336</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;III</td>
<td valign="middle" align="center">8.99 (7.19-11.33)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.17 (0.93-1.48)</td>
<td valign="middle" align="center">0.179</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;IV</td>
<td valign="middle" align="center">24.81 (19.71-31.56)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.59 (1.09-2.35)</td>
<td valign="middle" align="center">0.018</td>
</tr>
<tr>
<td valign="top" align="left">T_Stage: T1</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;T2</td>
<td valign="middle" align="center">3.5 (2.9-4.22)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.11 (0.89-1.38)</td>
<td valign="middle" align="center">0.374</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;T3</td>
<td valign="middle" align="center">3.33 (2.83-3.93)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.17 (0.92-1.47)</td>
<td valign="middle" align="center">0.196</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;T4</td>
<td valign="middle" align="center">15.41 (12.14-19.67)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.59 (1.03-2.54)</td>
<td valign="middle" align="center">0.051</td>
</tr>
<tr>
<td valign="top" align="left">N_Stage: N0</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;N1</td>
<td valign="middle" align="center">1.26 (1.16-1.38)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.1 (0.86-1.41)</td>
<td valign="middle" align="center">0.448</td>
</tr>
<tr>
<td valign="top" align="left">M_Stage: M0</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;M1</td>
<td valign="middle" align="center">10.69 (8.7-13.32)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.26 (1.07-1.48)</td>
<td valign="middle" align="center">0.005</td>
</tr>
<tr>
<td valign="top" align="left">Tumor_Size: &lt;2cm</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;2-3.9cm</td>
<td valign="middle" align="center">2.75 (2.4-3.15)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.74 (1.5-2.02)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;4-5.9cm</td>
<td valign="middle" align="center">4.57 (3.92-5.32)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">2.19 (1.85-2.59)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;6-7.9cm</td>
<td valign="middle" align="center">5.8 (4.62-7.32)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">2.63 (2.08-3.34)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&gt;8cm</td>
<td valign="middle" align="center">3.62 (2.77-4.79)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.63 (1.22-2.19)</td>
<td valign="middle" align="center">0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="middle" align="center">9.43 (7.13-12.67)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.72 (1.3-2.3)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Surgery_Type: No Surgery</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Local or partial pancreatectomy</td>
<td valign="middle" align="center">0.07 (0.06-0.08)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.15 (0.11-0.2)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Total pancreatectomy</td>
<td valign="middle" align="center">0.08 (0.06-0.09)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.15 (0.12-0.21)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Lymph_Nodes_Surgery: No or biopsy only</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;1-3 regional lymph nodes removed</td>
<td valign="middle" align="center">0.14 (0.11-0.17)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.09 (0.76-1.54)</td>
<td valign="middle" align="center">0.652</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;4 or more regional lymph nodes removed</td>
<td valign="middle" align="center">0.09 (0.08-0.11)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.74 (0.53-1.02)</td>
<td valign="middle" align="center">0.067</td>
</tr>
<tr>
<td valign="top" align="left">Regional_Lymph_Nodes: No nodes were examined</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Negative</td>
<td valign="middle" align="center">0.06 (0.05-0.07)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.75 (0.51-1.12)</td>
<td valign="middle" align="center">0.158</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Positive</td>
<td valign="middle" align="center">0.14 (0.12-0.17)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.28 (0.88-1.86)</td>
<td valign="middle" align="center">0.196</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="middle" align="center">0.19 (0.09-0.52)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.53 (0.21-1.54)</td>
<td valign="middle" align="center">0.205</td>
</tr>
<tr>
<td valign="top" align="left">Chemotherapy: None/Unknown</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="middle" align="center">0.57 (0.51-0.63)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.57 (0.52-0.64)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Radiotherapy: None/Unknown</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="middle" align="center">0.55 (0.5-0.6)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.79 (0.72-0.87)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Metastasis: No</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="middle" align="center">2.37 (2.17-2.58)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.9 (0.6-1.4)</td>
<td valign="middle" align="center">0.633</td>
</tr>
<tr>
<td valign="top" align="left">Bone_Metastasis: No</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="middle" align="center">12.58 (3.98-76.41)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">2.29 (0.68-14.29)</td>
<td valign="middle" align="center">0.262</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="middle" align="center">1.46 (1.34-1.59)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.83 (0.05-21.63)</td>
<td valign="middle" align="center">0.919</td>
</tr>
<tr>
<td valign="top" align="left">Brain_Metastasis: No</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="top" align="center">2.92 (0-NA)</td>
<td valign="top" align="center">0.908</td>
<td valign="middle" align="center">1766.26 (0-NA)</td>
<td valign="middle" align="center">0.958</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="middle" align="center">1.44 (1.32-1.57)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.96 (0.06-25.1)</td>
<td valign="middle" align="center">0.984</td>
</tr>
<tr>
<td valign="top" align="left">Liver_Metastasis: No</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="middle" align="center">10 (7.34-14.05)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.03 (0.58-1.79)</td>
<td valign="middle" align="center">0.930</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="middle" align="center">1.75 (1.6-1.91)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">4.39 (0.42-24.26)</td>
<td valign="middle" align="center">0.150</td>
</tr>
<tr>
<td valign="top" align="left">Lung_Metastasis: No</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="middle" align="center">9.75 (5.33-20.47)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.06 (0.51-2.44)</td>
<td valign="middle" align="center">0.877</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="middle" align="center">1.51 (1.38-1.64)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.2 (0.06-0.99)</td>
<td valign="middle" align="center">0.023</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3_3">
<title>Development and validation of predictive model for three-year survival</title>
<p>To establish a precise model to predict three-year survival, we utilized the eight variables (&#x201c;AJCC_Stage&#x201d;, &#x201c;Chemotherapy&#x201d;, &#x201c;Age&#x201d;, &#x201c;Grade&#x201d;, &#x201c;Lung_Metastasis&#x201d;, &#x201c;M_Stage&#x201d;, &#x201c;Surgery_Type&#x201d;, &#x201c;Tumor_Size&#x201d;) selected by RFE and RRA. A total of 13 ML models, comprising CatBoost, RF, SVM, XGB, DT, GBM, KNN, LR, NBC, LDA, QDA, NNET and GLM algorithms, were developed by incorporating the above selection of eight variables in the training set. Hyperparameters were fine-tuned by performing 5-fold cross-validation and random searches. Then we evaluated the 13 ML models in the internal validation and external validation cohorts, respectively. Finally, ROC curve analysis found that the CatBoost model had the highest AUC in the training (0.932 [0.924, 0.939]), internal validation (0.899 [0.873, 0.934]) and external validation (0.826 [0.735, 0.919]) cohorts (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3A</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4A</bold>
</xref>, <xref ref-type="fig" rid="f5">
<bold>5A</bold>
</xref>). The CatBoost model had an accuracy of 0.839 [0.831, 0.847], sensitivity of 0.872 [0.858, 0.887], specificity of 0.803 [0.784, 0.825] and precision of 0.832 [0.821, 0.853]. After grid search in hyperparameter tuning, the best hyperparameter values of CatBoost were depth, 5; learning_rate, 0.01678325; iterations, 548; l2_leaf_reg, 7.409126. The precision-recall curves (PRC) revealed that the CatBoost model was powerful in handling imbalanced datasets (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3B</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4B</bold>
</xref>, <xref ref-type="fig" rid="f5">
<bold>5B</bold>
</xref>). Calibration plots showed that CatBoost algorithm had the best fitting ability and could accurately predict three-year survival (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3C</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4C</bold>
</xref>, <xref ref-type="fig" rid="f5">
<bold>5C</bold>
</xref>). This indicates that the model&#x2019;s probability estimates are reliable and well-calibrated, as it ensures that the risk estimates provided by the model can be trusted to reflect the true likelihood of patient outcomes. DCA curves suggested that CatBoost algorithm had the best clinical application value and could effectively help predict three-year survival (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3D</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4D</bold>
</xref>, <xref ref-type="fig" rid="f5">
<bold>5D</bold>
</xref>). This implies that using the CatBoost model to guide clinical decision-making would result in more effective identification of patients who are likely to benefit from certain interventions, such as more aggressive treatment or intensive monitoring. The accuracy, sensitivity, specificity, precision, cross-entropy, Brier scores, Balanced Accuracy (bacc) and F Beta Score (fbeta) of the 13 ML models were calculated to comprehensively evaluate the model performance, which revealed that CatBoost model was robust in predicting three-year survival (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3E</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4E</bold>
</xref>, <xref ref-type="fig" rid="f5">
<bold>5E</bold>
</xref>). The results of tenfold cross-validation indicated that CatBoost exhibited the best performance (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3F</bold>
</xref>). Confusion matrix displayed the outstanding predictive ability of CatBoost in the internal validation and external validation cohorts (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4F</bold>
</xref>, <xref ref-type="fig" rid="f5">
<bold>5F</bold>
</xref>). Therefore, CatBoost was chosen as the best model for the next step.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Establishment and evaluation of the ML models in the training set. <bold>(A)</bold> ROC curves of different ML models in the training set. <bold>(B)</bold> PR curves of different ML models in the training set. <bold>(C)</bold> Calibration curves of different ML models in the training set. <bold>(D)</bold> DCA curves of different ML models in the training set. <bold>(E)</bold> The performance of 13 ML models in terms of AUC, PRAUC, accuracy, sensitivity, specificity, precision, cross-entropy, Brier scores and Balanced Accuracy (bacc) and F Beta Score (fbeta) in the training set. <bold>(F)</bold> Ten-fold cross-validation results of different ML models in the training set. ML, machine learning; CAT, categorical boosting; LR, logistic regression; DT, decision tree; RF, random forest; XGB, extreme gradient boosting; GBM, gradient boosting machine; NB, Naive Bayes; LDA, linear discriminant analysis; QDA, quadratic discriminant analysis; NNET, neural network; GLMNET, generalized linear models with elastic net regularization; SVM, support vector machine; KNN, k-nearest neighbor.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1488118-g003.tif"/>
</fig>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Evaluation of the ML models in the internal validation set. <bold>(A)</bold> ROC curves of different ML models in the internal validation set. <bold>(B)</bold> PR curves of different ML models in the internal validation set. <bold>(C)</bold> Calibration curves of different ML models in the internal validation set. <bold>(D)</bold> DCA curves of different ML models in the internal validation set. <bold>(E)</bold> The performance of 13 ML models in terms of AUC, PRAUC, accuracy, sensitivity, specificity, precision, cross-entropy, Brier scores and Balanced Accuracy (bacc) and F Beta Score (fbeta) in the internal validation set. <bold>(F)</bold> Confusion matrix of the best ML model in the internal validation set. ML, machine learning; CAT, categorical boosting; LR, logistic regression; DT, decision tree; RF, random forest; XGB, extreme gradient boosting; GBM, gradient boosting machine; NB, Naive Bayes; LDA, linear discriminant analysis; QDA, quadratic discriminant analysis; NNET, neural network; GLMNET, generalized linear models with elastic net regularization; SVM, support vector machine; KNN, k-nearest neighbor.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1488118-g004.tif"/>
</fig>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Evaluation of the ML models in the external validation set. <bold>(A)</bold> ROC curves of different ML models in the external validation set. <bold>(B)</bold> PR curves of different ML models in the external validation set. <bold>(C)</bold> Calibration curves of different ML models in the external validation set. <bold>(D)</bold> DCA curves of different ML models in the external validation set. <bold>(E)</bold> The performance of 13 ML models in terms of AUC, PRAUC, accuracy, sensitivity, specificity, precision, cross-entropy, Brier scores and Balanced Accuracy (bacc) and F Beta Score (fbeta) in the external validation set. <bold>(F)</bold> Confusion matrix of the best ML model in the external validation set. ML, machine learning; CAT, categorical boosting; LR, logistic regression; DT, decision tree; RF, random forest; XGB, extreme gradient boosting; GBM, gradient boosting machine; NB, Naive Bayes; LDA, linear discriminant analysis; QDA, quadratic discriminant analysis; NNET, neural network; GLMNET, generalized linear models with elastic net regularization; SVM, support vector machine; KNN, k-nearest neighbor.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1488118-g005.tif"/>
</fig>
</sec>
<sec id="s3_4">
<title>Model interpretation</title>
<p>We calculated the feature importance rankings of each ML model and illustrated eight of them, including CatBoost, GBM, GLM, NB, KNN, RF, NNET and SVM (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6A</bold>
</xref>). The importance scores were determined by leveraging the inherent attributes of various ML algorithms, which revealed that the risk factors most associated with three-year survival were &#x201c;Surgery Type&#x201d;, &#x201c;AJCC Stage&#x201d; and &#x201c;M Stage&#x201d;. Subsequently, we utilized SHAP framework to interpret CatBoost model. We illustrated all of the risk factors evaluated by the mean absolute SHAP value, which revealed that &#x201c;Surgery Type&#x201d; was the most impactful variable (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6B</bold>
</xref>). Besides, beeswarm plot elucidated the influence of various risk factors on three-year survival (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6C</bold>
</xref>). The y-axis denotes the magnitude of the risk factors, while the x-axis represents their impact on the model&#x2019;s output, specifically three-year survival, as measured by the SHAP value. It was observed that no surgery, higher grade, older age, the presence of lung metastasis, no chemotherapy, higher AJCC stage and M1 stage were associated with an increased likelihood of death during the three-year follow-up. To illustrate the model&#x2019;s interpretability, we highlighted two representative cases. SHAP values were used to understand the impact of each feature on the model&#x2019;s prediction. In our study, lower SHAP values indicate a higher likelihood of three-year survival, while higher SHAP values suggest a higher probability of death within the three-year follow-up. We chose the median value (0.0962) as the cut-off point for predicting the low or high probability of three-year survival. For instance, the first patient with three-year survival had a lower SHAP value and a prediction score of 0.0276, indicating a higher likelihood of three-year survival (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6D</bold>
</xref>). In contrast, the second patient without three-year survival showed a higher SHAP value and a prediction score of 0.187, suggesting a higher probability of death in three-year follow-up (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6E</bold>
</xref>).</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>ML model interpretation. <bold>(A)</bold> Importance ranking of features in eight ML prediction algorithms (CatBoost, GBM, GLM, NB, KNN, RF, NNET and SVM). <bold>(B)</bold> The importance ranking of different variables according to the mean (|SHAP value|) using the optimal CatBoost model. <bold>(C)</bold> The importance ranking of different risk factors with stability and interpretation using the optimal CatBoost model. The higher the SHAP value of a feature, the higher the risk of death within the three-year follow-up the patient would have. The yellow part in feature value represents higher value. <bold>(D)</bold> SHAP value explanation in a classical sample with three-year survival. <bold>(E)</bold> SHAP value explanation in a classical sample without three-year survival.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1488118-g006.tif"/>
</fig>
</sec>
<sec id="s3_5">
<title>Prognostic model establishment and performance</title>
<p>To explore the prognostic values of multiple variables, we performed univariate and multivariate Cox analysis and found that &#x201c;Sex&#x201d; (HR 0.934(0.907-0.963)), &#x201c;Race&#x201d; (HR 1.071(1.022-1.123)), &#x201c;Age&#x201d; (HR 1.19(1.119-1.264)), &#x201c;Marital_Status&#x201d; (HR 1.137(1.086-1.191)), &#x201c;Household_Income&#x201d; (HR 0.866(0.837-0.896)), &#x201c;Household_Location&#x201d; (HR 0.945(0.899-0.993)), &#x201c;Tumor_Primary_Site&#x201d; (HR 0.946(0.91-0.983)), &#x201c;Histology&#x201d; (HR 0.706(0.66-0.755)), &#x201c;Grade&#x201d; (HR 1.334(1.271-1.401)), &#x201c;Tumor_Size&#x201d; (HR 1.325(1.238-1.417)), &#x201c;AJCC_Stage&#x201d; (HR 0.712(0.643-0.789)), &#x201c;T_Stage&#x201d; (HR 1.127(1.024-1.242)), &#x201c;Surgery_Type&#x201d; (HR 0.491(0.45-0.535)), &#x201c;Lymph_Nodes_Surgery&#x201d; (HR 0.846(0.761-0.94)), &#x201c;Regional_Lymph_Nodes&#x201d; (HR 0.709(0.65-0.774)), &#x201c;Radiotherapy&#x201d; (HR 0.905(0.873-0.938)), &#x201c;Chemotherapy&#x201d; (HR 0.582(0.562-0.602)), &#x201c;Bone_Metastasis&#x201d; (HR 1.196(1.006-1.422)), &#x201c;Liver_Metastasis&#x201d; (HR 1.338(1.224-1.463)), &#x201c;Lung_Metastasis&#x201d; (HR 1.338(1.224-1.463)) and &#x201c;Metastasis&#x201d; (HR 0.781(0.709-0.861)) were independent prognostic variables for predicting OS in pancreatic cancer patients (P &lt; 0.05, <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>). Incorporating these clinical variables, 101 prognostic ML algorithm combinations were constructed via LOOCV framework. The C-index of each ML combination was calculated in training, internal validation and external validation datasets (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7A</bold>
</xref>). Among the top five ML combinations with the highest C-index across the three cohorts, logarithmic loss, recall and decision calibration were calculated to assess model performance, demonstrating the good calibration and precision of the &#x201c;RSF+GBM&#x201d; model (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;1</bold>
</xref>). The best ML model combination was &#x201c;RSF+GBM&#x201d;, which was established based on RSF algorithm in feature selection (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7B</bold>
</xref>), and GBM algorithm in model construction (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7C</bold>
</xref>), with the highest average C-index (0.723) across three datasets (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7A</bold>
</xref>). Finally, a 20-variable &#x201c;RSF+GBM&#x201d; prognostic ML model was accordingly established to predict OS of pancreatic patients, with &#x201c;Surgery Type&#x201d; being the most significant variable both in the feature importance visualization of RSF and GBM model (<xref ref-type="fig" rid="f7">
<bold>Figures&#xa0;7B, C</bold>
</xref>). ROC curves of 1-, 3- and 5-year OS showed good specificity of the &#x201c;RSF+GBM&#x201d; model (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7D</bold>
</xref>). Time-dependent ROC curves showed that the curve of the &#x201c;RSF+GBM&#x201d; model lay above the other curves at most time points, indicating that the &#x201c;RSF+GBM&#x201d; model remarkably outperformed conventional clinical variables in discrimination and prediction (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7E</bold>
</xref>). Calibration curves (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7F</bold>
</xref>) and DCA curves (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7G</bold>
</xref>) showed that the &#x201c;RSF+GBM&#x201d; model performed well in accuracy and clinical benefit. Based on risk scores calculated by the GBM algorithm, we utilized the median risk score to divide patients in the training, internal validation and external validation cohorts into low-risk and high-risk groups, respectively. Obviously, the low-risk group had a relatively longer OS than the high-risk group in the training, internal validation and external validation cohorts, respectively (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7H</bold>
</xref>). The K-M curves validated the risk stratification capability of the &#x201c;RSF+GBM&#x201d; model. All these metrics collectively indicated that the &#x201c;RSF+GBM&#x201d; model demonstrated stable and robust performance. In conclusion, we have successfully developed an &#x201c;RSF+GBM&#x201d; model to predict OS in pancreatic cancer patients, which outperformed other models and performed well across evaluation metrics.</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Univariate and multivariate Cox regression analysis of pancreatic cancer patients for overall survival in the training cohort.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">Variable</th>
<th valign="top" colspan="2" align="center">Univariate Cox analysis</th>
<th valign="top" colspan="2" align="center">Multivariate Cox analysis</th>
</tr>
<tr>
<th valign="top" align="left">term</th>
<th valign="top" align="center">HR (95%CI)</th>
<th valign="top" align="center">p.value</th>
<th valign="top" align="center">HR (95%CI)</th>
<th valign="top" align="center">p.value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Sex: Male</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">Female</td>
<td valign="middle" align="center">0.96 (0.94-0.99)</td>
<td valign="middle" align="center">0.012</td>
<td valign="middle" align="center">0.934 (0.907-0.963)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Age: &lt;50</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">50-59</td>
<td valign="middle" align="center">1.09 (1.02-1.16)</td>
<td valign="middle" align="center">0.008</td>
<td valign="middle" align="center">1.114 (1.045-1.188)</td>
<td valign="middle" align="center">0.001</td>
</tr>
<tr>
<td valign="top" align="left">60-69</td>
<td valign="middle" align="center">1.12 (1.06-1.19)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.19 (1.119-1.264)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">70-79</td>
<td valign="middle" align="center">1.33 (1.25-1.41)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.412 (1.326-1.502)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&gt;=80</td>
<td valign="middle" align="center">1.76 (1.64-1.88)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.598 (1.487-1.717)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Race: White</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Black</td>
<td valign="middle" align="center">1.12 (1.07-1.18)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.071 (1.022-1.123)</td>
<td valign="middle" align="center">0.004</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Other</td>
<td valign="middle" align="center">0.96 (0.91-1.01)</td>
<td valign="middle" align="center">0.121</td>
<td valign="middle" align="center">1.022 (0.97-1.077)</td>
<td valign="middle" align="center">0.41</td>
</tr>
<tr>
<td valign="top" align="left">Marital_Status: Married</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unmarried</td>
<td valign="middle" align="center">1.11 (1.06-1.16)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.137 (1.086-1.191)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Widowed or divorced</td>
<td valign="middle" align="center">1.23 (1.19-1.27)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.162 (1.121-1.206)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="middle" align="center">1.07 (0.98-1.16)</td>
<td valign="middle" align="center">0.151</td>
<td valign="middle" align="center">1.07 (0.981-1.167)</td>
<td valign="middle" align="center">0.126</td>
</tr>
<tr>
<td valign="top" align="left">Household_Income: &lt;$70,000</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&gt;=$70,000</td>
<td valign="middle" align="center">0.89 (0.87-0.92)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.866 (0.837-0.896)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Household_Location: Rural</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Urban</td>
<td valign="middle" align="center">0.91 (0.87-0.95)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.945 (0.899-0.993)</td>
<td valign="middle" align="center">0.025</td>
</tr>
<tr>
<td valign="top" align="left">Tumor_Primary_Site: Pancreas Head</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Pancreas Body or Tail</td>
<td valign="middle" align="center">1.17 (1.13-1.21)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.946 (0.91-0.983)</td>
<td valign="middle" align="center">0.005</td>
</tr>
<tr>
<td valign="bottom" align="left">&#x2003;Other</td>
<td valign="middle" align="center">1.3 (1.25-1.36)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.004 (0.96-1.051)</td>
<td valign="middle" align="center">0.858</td>
</tr>
<tr>
<td valign="top" align="left">Histology: Adenomas and adenocarcinomas</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Ductal and lobular neoplasms</td>
<td valign="middle" align="center">0.71 (0.68-0.73)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.022 (0.986-1.059)</td>
<td valign="middle" align="center">0.236</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Cystic, mucinous and serous neoplasms</td>
<td valign="middle" align="center">0.59 (0.55-0.63)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.706 (0.66-0.755)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Other</td>
<td valign="middle" align="center">0.89 (0.79-1)</td>
<td valign="middle" align="center">0.05</td>
<td valign="middle" align="center">0.876 (0.776-0.988)</td>
<td valign="middle" align="center">0.032</td>
</tr>
<tr>
<td valign="top" align="left">Grade: Well differentiated I</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Moderately differentiated II</td>
<td valign="middle" align="center">1.25 (1.2-1.32)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.334 (1.271-1.401)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Poorly differentiated III</td>
<td valign="middle" align="center">1.74 (1.66-1.83)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.718 (1.635-1.806)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Undifferentiated anaplastic IV</td>
<td valign="middle" align="center">1.74 (1.53-1.99)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.485 (1.302-1.694)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Summary_Stage: Localized</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Regional</td>
<td valign="middle" align="center">1.62 (1.53-1.71)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.847 (1.641-2.079)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Distant</td>
<td valign="middle" align="center">3.78 (3.56-4)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">2.136 (1.935-2.357)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">AJCC_Stage: I</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;II</td>
<td valign="middle" align="center">1.56 (1.48-1.65)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.712 (0.643-0.789)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;III</td>
<td valign="middle" align="center">2.76 (2.58-2.95)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.762 (0.687-0.846)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;IV</td>
<td valign="middle" align="center">4.59 (4.32-4.88)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">NA (NA-NA)</td>
<td valign="middle" align="center">NA</td>
</tr>
<tr>
<td valign="top" align="left">T_Stage: T1</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;T2</td>
<td valign="middle" align="center">2 (1.84-2.17)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.066 (0.969-1.172)</td>
<td valign="middle" align="center">0.19</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;T3</td>
<td valign="middle" align="center">1.85 (1.72-2)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.127 (1.024-1.242)</td>
<td valign="middle" align="center">0.015</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;T4</td>
<td valign="middle" align="center">3.4 (3.13-3.69)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.15 (1.029-1.285)</td>
<td valign="middle" align="center">0.014</td>
</tr>
<tr>
<td valign="top" align="left">N_Stage: N0</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;N1</td>
<td valign="middle" align="center">1.05 (1.02-1.08)</td>
<td valign="middle" align="center">0.002</td>
<td valign="middle" align="center">1.036 (0.988-1.087)</td>
<td valign="middle" align="center">0.148</td>
</tr>
<tr>
<td valign="top" align="left">M_Stage: M0</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;M1</td>
<td valign="middle" align="center">1.96 (1.9-2.02)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.017 (0.962-1.075)</td>
<td valign="middle" align="center">0.553</td>
</tr>
<tr>
<td valign="top" align="left">Tumor_Size: &lt;2cm</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;2-3.9cm</td>
<td valign="middle" align="center">1.6 (1.51-1.7)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.325 (1.238-1.417)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;4-5.9cm</td>
<td valign="middle" align="center">2.12 (1.99-2.25)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.514 (1.41-1.625)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;6-7.9cm</td>
<td valign="middle" align="center">2.46 (2.28-2.65)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.722 (1.581-1.875)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;&gt;8cm</td>
<td valign="middle" align="center">2.22 (2.02-2.44)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.629 (1.467-1.808)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="middle" align="center">3.01 (2.78-3.26)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.439 (1.318-1.572)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Surgery_Type: No Surgery</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Local or partial pancreatectomy</td>
<td valign="middle" align="center">0.31 (0.3-0.32)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.491 (0.45-0.535)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Total pancreatectomy</td>
<td valign="middle" align="center">0.33 (0.31-0.34)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.507 (0.462-0.556)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Lymph_Nodes_Surgery: No or biopsy only</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;1-3 regional lymph nodes removed</td>
<td valign="middle" align="center">0.41 (0.38-0.44)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.991 (0.888-1.105)</td>
<td valign="middle" align="center">0.868</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;4 or more regional lymph nodes removed</td>
<td valign="middle" align="center">0.33 (0.32-0.35)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.846 (0.761-0.94)</td>
<td valign="middle" align="center">0.002</td>
</tr>
<tr>
<td valign="top" align="left">Regional_Lymph_Nodes: No nodes were examined</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Negative</td>
<td valign="middle" align="center">0.25 (0.24-0.27)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.709 (0.65-0.774)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Positive</td>
<td valign="middle" align="center">0.41 (0.39-0.42)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.03 (0.941-1.128)</td>
<td valign="middle" align="center">0.524</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="middle" align="center">0.71 (0.53-0.94)</td>
<td valign="middle" align="center">0.018</td>
<td valign="middle" align="center">0.914 (0.682-1.225)</td>
<td valign="middle" align="center">0.547</td>
</tr>
<tr>
<td valign="top" align="left">Chemotherapy: None/Unknown</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="middle" align="center">0.65 (0.63-0.67)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.582 (0.562-0.602)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Radiotherapy: None/Unknown</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="middle" align="center">0.69 (0.67-0.71)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.905 (0.873-0.938)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Metastasis: No</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="middle" align="center">1.58 (1.54-1.63)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.781 (0.709-0.861)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">Bone_Metastasis: No</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="middle" align="center">2.82 (2.39-3.33)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.196 (1.006-1.422)</td>
<td valign="middle" align="center">0.042</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="middle" align="center">1.19 (1.16-1.23)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.186 (0.636-2.21)</td>
<td valign="middle" align="center">0.591</td>
</tr>
<tr>
<td valign="top" align="left">Brain_Metastasis: No</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="middle" align="center">5.37 (2.23-12.9)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.822 (0.747-4.446)</td>
<td valign="middle" align="center">0.187</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="middle" align="center">1.18 (1.15-1.22)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.909 (0.498-1.659)</td>
<td valign="middle" align="center">0.756</td>
</tr>
<tr>
<td valign="top" align="left">Liver_Metastasis: No</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="middle" align="center">2.99 (2.84-3.15)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.338 (1.224-1.463)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="middle" align="center">1.34 (1.3-1.39)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.753 (1.27-2.419)</td>
<td valign="middle" align="center">0.001</td>
</tr>
<tr>
<td valign="top" align="left">Lung_Metastasis: No</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="middle" align="center">2.77 (2.52-3.04)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.338 (1.224-1.463)</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Unknown</td>
<td valign="middle" align="center">1.22 (1.19-1.26)</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">1.753 (1.27-2.419)</td>
<td valign="middle" align="center">0.001</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Establishment and validation of the prognostic model for pancreatic cancer patients. <bold>(A)</bold> A total of 101 kinds of prognostic models were constructed via a leave-one-out cross-validation framework, and the C-index of each model was calculated. <bold>(B)</bold> Feature selection process by the RSF algorithm. <bold>(C)</bold> Model construction by the GBM algorithm and visualization of feature importance. <bold>(D)</bold> ROC curves of the ML model in the training, internal validation and external validation cohorts. <bold>(E)</bold> Time-dependent AUC values of the ML model in the training, internal validation and external validation cohorts. <bold>(F)</bold> Calibration curves of the ML model in the training, internal validation and external validation cohorts. <bold>(G)</bold> DCA curves of the ML model in the training, internal validation and external validation cohorts. <bold>(H)</bold> K-M curves of low-risk and high-risk groups divided by the ML model in the training, internal validation and external validation cohorts. Left: training cohort, Middle: internal validation cohort, Right: external validation cohort.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1488118-g007.tif"/>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<title>Discussion</title>
<p>Pancreatic cancer is among the most invasive and deadly malignancies, with projections suggesting it could become the second leading cause of cancer-related deaths by 2030 (<xref ref-type="bibr" rid="B21">21</xref>). Although radical surgery offers a chance for a cure, high rates of postoperative recurrence and mortality remain a significant concern (<xref ref-type="bibr" rid="B22">22</xref>). Given these challenges, accurately predicting survival rates and identifying prognostic risk factors are of critical importance for pancreatic cancer patients. In this study, we focused on developing novel predictive and prognostic ML models for the early prediction of three-year survival and for forecasting the prognosis of pancreatic cancer patients. By gathering clinical data on several key variables and establishing ML models via a benchmark framework, we were able to calculate risk scores related to prediction and prognosis, enabling us to precisely predict the probability of three-year survival and the prognosis of patients. The model analyzes various clinical and demographic features to provide a risk score for three-year survival and prognosis, which helps clinicians determine the intensity and type of treatment required for each patient, and it outperforms existing models that do not use ML algorithms (<xref ref-type="bibr" rid="B23">23</xref>, <xref ref-type="bibr" rid="B24">24</xref>).</p>
<p>The clinical importance of this work lies in its potential to enhance patient management and treatment planning for those diagnosed with pancreatic cancer. By providing an accurate risk stratification tool, our model can significantly aid clinicians in making more informed, personalized treatment decisions. For instance, patients identified as high-risk for three-year mortality could be prioritized for aggressive surgical interventions, adjuvant therapies, and closer post-operative monitoring, which may improve their chances of survival. Conversely, patients deemed low-risk could benefit from less intensive treatments, thereby avoiding the potential side effects and complications associated with overtreatment. Additionally, the model&#x2019;s predictions can help the selection of adjuvant therapies, the frequency of follow-up visits, and the need for additional laboratory tests. By integrating the prediction model into clinical workflows, we enable data-driven decision-making that optimizes patient outcomes and resource allocation. As a result, it helps in standardizing care across different healthcare providers and institutions, potentially reducing variability in treatment approaches and outcomes for pancreatic cancer patients.</p>
<p>Moreover, the highlight of our study lies in showcasing how interpretable ML algorithms, particularly through the use of SHAP values, can effectively decipher key factors contributing to the prediction of three-year survival. The CatBoost algorithm is a gradient boosting framework based on the symmetric decision tree (oblivious trees) algorithm, which boasts high accuracy and requires fewer parameters, making it efficient and effective in handling categorical features (<xref ref-type="bibr" rid="B25">25</xref>). CatBoost&#x2019;s performance rivals that of other advanced machine learning algorithms, demonstrating its superiority in many applications. However, the black-box nature of the CatBoost model necessitates its interpretation and explanation with intuitive figures. CatBoost&#x2019;s SHAP summary plots and force maps serve as valuable tools, offering clinicians a visual and intuitive means to understand and identify the critical features influencing three-year survival, which not only elucidates the pivotal risk factors but also improves the interpretability of ML models in clinical settings. Meanwhile, several advanced ML techniques, including feature selection through RFECV, hyperparameter optimization with GridSearchCV, and addressing sample imbalance using SMOTE oversampling, significantly enhanced the prediction accuracy for the probability of three-year survival. Overall, our precise ML prediction model allows clinicians to design personalized treatment plans, helping them tailor therapies in a timely manner and improve the prognosis of pancreatic cancer patients.</p>
<p>Researchers have previously shown that old age, high histological grade, large tumor size, AJCC stage, surgery type and metastasis are associated with poorer long-term survival outcomes for pancreatic cancer patients (<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B27">27</xref>). In clinical practice, serum CA199 and CEA levels are commonly used biomarkers in pancreatic cancer, and high levels of CA199 are generally associated with a worse prognosis. Meanwhile, the methylation status of NPTX2, BMP3 and SPARC genes plays an important role in the prognosis of pancreatic cancer. Researchers suggest that methylation of these genes could be used as non-invasive biomarkers to assess prognosis and monitor disease progression in patients with pancreatic cancer (<xref ref-type="bibr" rid="B28">28</xref>). In our analysis, we performed univariate and multivariate logistic and Cox regression analyses to discover important predictive factors for three-year survival, as well as independent risk factors for prognosis. Based on clinical variables which can be easily obtained in clinical practice, we succeeded in constructing a powerful CatBoost model for the early prediction of three-year survival.</p>
<p>In our research, we observed that patients with pancreatic cancer who underwent surgical resection demonstrated significantly improved survival rates, as supported by Hester et&#xa0;al.&#x2019;s analysis of the National Cancer Database (<xref ref-type="bibr" rid="B29">29</xref>). However, surgery alone is often insufficient for achieving long-term survival, with median survival times typically ranging from 8 to 10 months, frequently accompanied by tumor recurrence (<xref ref-type="bibr" rid="B30">30</xref>). Chemotherapy, both as a neoadjuvant (preoperative) and adjuvant (postoperative) treatment, has been identified through logistic and Cox regression analyses as a key independent factor in enhancing patient survival. Specifically, adjuvant chemotherapy has been shown to double median survival rates compared to patients who do not receive it, while neoadjuvant chemotherapy improves overall survival and increases the likelihood of R0 resection, making it a valuable treatment option (<xref ref-type="bibr" rid="B31">31</xref>). Additionally, age is an independent risk factor, with older patients exhibiting lower survival rates, likely due to diminished immunity and physical decline, which is also common in other types of cancer. Moreover, we found that race does play a role in pancreatic cancer prognosis. African Americans have a higher rate of pancreatic cancer than other racial groups, and their overall survival rate is lower. This difference may be related to a variety of factors, including socioeconomic status, access to and quality of health care, and genetic and environmental factors (<xref ref-type="bibr" rid="B32">32</xref>).</p>
<p>Gender can influence the prognosis of pancreatic cancer, though the impact is complex and varies depending on several factors (<xref ref-type="bibr" rid="B33">33</xref>). Our results show that women generally have a slightly better overall survival (OS) compared to men. This improved survival in women has also been observed in studies analyzing the outcomes of both standard treatments and more aggressive chemotherapy regimens like FOLFIRINOX (<xref ref-type="bibr" rid="B34">34</xref>). Moreover, our analysis showed that metastasis in pancreatic cancer significantly affected prognosis, with different metastatic sites influencing survival outcomes differently (<xref ref-type="bibr" rid="B35">35</xref>). Common sites of distant metastasis in pancreatic cancer include the peritoneum and liver, followed by the lungs, bones, and other organs (<xref ref-type="bibr" rid="B36">36</xref>). Liver metastasis is the most common and is associated with the poorest prognosis, often due to the liver&#x2019;s role in filtering blood and its involvement in the metabolism of cancer drugs. Lung metastasis, while also serious and crucial, generally presents a slightly better prognosis compared to liver involvement. Peritoneal metastasis reflects a more extensive spread of the disease within the abdominal cavity. This type of metastasis is particularly challenging because it often leads to complications such as ascites (the accumulation of fluid in the abdomen), which can be difficult to manage and severely impact the patient&#x2019;s quality of life. Overall, the presence of metastasis generally indicates an advanced disease and a poor prognosis, due to the difficulty of achieving complete surgical resection and the challenges in effectively targeting metastatic sites with systemic therapies.</p>
<p>While this study boasts certain strengths, it also faces multiple limitations. Firstly, we calculated the needed sample size for our external validation set, but we were unable to gather a large enough external validation set due to the limited number of patients with complete follow-up information. Although we recognize that large sample sizes improve the reliability of model evaluations, we have tried to collect the largest sample size available in the current research environment. Despite the small external validation set, we maximized the reliability of validation by using a 10-fold cross-validation approach to assess the model&#x2019;s ability to generalize. In future studies, we plan to increase the sample size of the external validation set, thereby further verifying the universality and reliability of the model. Secondly, our study relies on retrospective datasets sourced from the SEER database, introducing the possibility of selection bias. Meanwhile, the inconsistent data collection across multiple hospitals, as well as the retrospective study design, led to some missing clinical feature data. Thirdly, the absence of some key clinicopathological parameters is noted, due to the unavailability of image data and laboratory test indicators from the SEER database. The study predominantly utilizes baseline characteristics and routine clinical data as variables, without some important indicators such as CA199, CEA and KRAS gene mutation. To enhance the model&#x2019;s predictive accuracy and identify risk factors, a broad range of features was included, which somewhat complicates its practical application in a clinical setting. Finally, the model has yet to be implemented in clinical practice, thus necessitating prospective, multicenter, and large-scale validations to fully ascertain its generalizability in the future.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<title>Conclusions</title>
<p>In this study, we developed a CatBoost predictive model based on an ML benchmark framework to more accurately predict three-year survival for pancreatic cancer patients, surpassing traditional models in effectiveness and performance. We successfully identified significant predictive factors for three-year survival of pancreatic cancer. Meanwhile, we established a GBM prognostic model to predict the prognosis of pancreatic cancer patients in order to achieve personalized medicine. This research laid a foundation for future efforts aimed at enhancing three-year survival prediction and prognosis forecasting, which could help clinicians in decision-making and in tailoring therapy plans.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="s7" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving humans were approved by the Ethics Committee of The First People&#x2019;s Hospital of Lianyungang. The studies were conducted in accordance with the local legislation and institutional requirements. Written informed consent for participation was not required from the participants or the participants&#x2019; legal guardians/next of kin in accordance with the national legislation and institutional requirements. Written informed consent was obtained from the individual(s) for the publication of any potentially identifiable images or data included in this article.</p>
</sec>
<sec id="s8" sec-type="author-contributions">
<title>Author contributions</title>
<p>BT: Data curation, Formal analysis, Investigation, Methodology, Validation, Visualization, Writing &#x2013; original draft. XZ: Data curation, Formal analysis, Investigation, Methodology, Validation, Visualization, Writing &#x2013; original draft. MG: Data curation, Formal analysis, Writing &#x2013; original draft. MM: Data curation, Formal analysis, Writing &#x2013; original draft. WL: Conceptualization, Investigation, Supervision, Writing &#x2013; review &amp; editing. JM: Conceptualization, Investigation, Supervision, Writing &#x2013; review &amp; editing.</p>
</sec>
<sec id="s9" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research, authorship, and/or publication of this article.</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>We are grateful to the Surveillance, Epidemiology, and End Results (SEER) database for providing data.</p>
</ack>
<sec id="s10" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s12" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fonc.2024.1488118/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fonc.2024.1488118/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="DataSheet1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="Table1.xlsx" id="ST1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Siegel</surname> <given-names>RL</given-names>
</name>
<name>
<surname>Miller</surname> <given-names>KD</given-names>
</name>
<name>
<surname>Wagle</surname> <given-names>NS</given-names>
</name>
<name>
<surname>Jemal</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Cancer statistics, 2023</article-title>. <source>CA Cancer J Clin</source>. (<year>2023</year>) <volume>73</volume>:<fpage>17</fpage>&#x2013;<lpage>48</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3322/caac.21763</pub-id>
</citation>
</ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vincent</surname> <given-names>A</given-names>
</name>
<name>
<surname>Herman</surname> <given-names>J</given-names>
</name>
<name>
<surname>Schulick</surname> <given-names>R</given-names>
</name>
<name>
<surname>Hruban</surname> <given-names>RH</given-names>
</name>
<name>
<surname>Goggins</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Pancreatic cancer</article-title>. <source>Lancet</source>. (<year>2011</year>) <volume>378</volume>:<page-range>607&#x2013;20</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0140-6736(10)62307-0</pub-id>
</citation>
</ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gillen</surname> <given-names>S</given-names>
</name>
<name>
<surname>Schuster</surname> <given-names>T</given-names>
</name>
<name>
<surname>Meyer Zum B&#xfc;schenfelde</surname> <given-names>C</given-names>
</name>
<name>
<surname>Friess</surname> <given-names>H</given-names>
</name>
<name>
<surname>Kleeff</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Preoperative/neoadjuvant therapy in pancreatic cancer: a systematic review and meta-analysis of response and resection percentages</article-title>. <source>PLoS Med</source>. (<year>2010</year>) <volume>7</volume>:<elocation-id>e1000267</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pmed.1000267</pub-id>
</citation>
</ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>W</given-names>
</name>
</person-group>. <article-title>Pancreatic cancer: A review of risk factors, diagnosis, and treatment</article-title>. <source>Technol Cancer Res Treat</source>. (<year>2020</year>) <volume>19</volume>:<fpage>1533033820962117</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/1533033820962117</pub-id>
</citation>
</ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>He</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Targeting KRAS in PDAC: A new way to cure it?</article-title> <source>Cancers (Basel)</source>. (<year>2022</year>) <volume>14</volume>(<issue>20</issue>):<fpage>4982</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/cancers14204982</pub-id>
</citation>
</ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tempero</surname> <given-names>MA</given-names>
</name>
<name>
<surname>Malafa</surname> <given-names>MP</given-names>
</name>
<name>
<surname>Chiorean</surname> <given-names>EG</given-names>
</name>
<name>
<surname>Czito</surname> <given-names>B</given-names>
</name>
<name>
<surname>Scaife</surname> <given-names>C</given-names>
</name>
<name>
<surname>Narang</surname> <given-names>AK</given-names>
</name>
<etal/>
</person-group>. <article-title>Pancreatic adenocarcinoma, version 1.2019</article-title>. <source>J Natl Compr Canc Netw</source>. (<year>2019</year>) <volume>17</volume>:<page-range>202&#x2013;10</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.6004/jnccn.2019.0014</pub-id>
</citation>
</ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mitchell</surname> <given-names>PS</given-names>
</name>
<name>
<surname>Parkin</surname> <given-names>RK</given-names>
</name>
<name>
<surname>Kroh</surname> <given-names>EM</given-names>
</name>
<name>
<surname>Fritz</surname> <given-names>BR</given-names>
</name>
<name>
<surname>Wyman</surname> <given-names>SK</given-names>
</name>
<name>
<surname>Pogosova-Agadjanyan</surname> <given-names>EL</given-names>
</name>
<etal/>
</person-group>. <article-title>Circulating microRNAs as stable blood-based markers for cancer detection</article-title>. <source>Proc Natl Acad Sci U S A</source>. (<year>2008</year>) <volume>105</volume>:<page-range>10513&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.0804549105</pub-id>
</citation>
</ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chalmers</surname> <given-names>ZR</given-names>
</name>
<name>
<surname>Connelly</surname> <given-names>CF</given-names>
</name>
<name>
<surname>Fabrizio</surname> <given-names>D</given-names>
</name>
<name>
<surname>Gay</surname> <given-names>L</given-names>
</name>
<name>
<surname>Ali</surname> <given-names>SM</given-names>
</name>
<name>
<surname>Ennis</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>Analysis of 100,000 human cancer genomes reveals the landscape of tumor mutational burden</article-title>. <source>Genome Med</source>. (<year>2017</year>) <volume>9</volume>:<fpage>34</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13073-017-0424-2</pub-id>
</citation>
</ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Collins</surname> <given-names>GS</given-names>
</name>
<name>
<surname>Dhiman</surname> <given-names>P</given-names>
</name>
<name>
<surname>Andaur Navarro</surname> <given-names>CL</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>J</given-names>
</name>
<name>
<surname>Hooft</surname> <given-names>L</given-names>
</name>
<name>
<surname>Reitsma</surname> <given-names>JB</given-names>
</name>
<etal/>
</person-group>. <article-title>Protocol for development of a reporting guideline (TRIPOD-AI) and risk of bias tool (PROBAST-AI) for diagnostic and prognostic prediction model studies based on artificial intelligence</article-title>. <source>BMJ Open</source>. (<year>2021</year>) <volume>11</volume>:<elocation-id>e048008</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmjopen-2020-048008</pub-id>
</citation>
</ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pera</surname> <given-names>M</given-names>
</name>
<name>
<surname>Gibert</surname> <given-names>J</given-names>
</name>
<name>
<surname>Gimeno</surname> <given-names>M</given-names>
</name>
<name>
<surname>Garsot</surname> <given-names>E</given-names>
</name>
<name>
<surname>Eizaguirre</surname> <given-names>E</given-names>
</name>
<name>
<surname>Mir&#xf3;</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Machine learning risk prediction model of 90-day mortality after gastrectomy for cancer</article-title>. <source>Ann Surg</source>. (<year>2022</year>) <volume>276</volume>:<page-range>776&#x2013;83</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/SLA.0000000000005616</pub-id>
</citation>
</ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhuang</surname> <given-names>D</given-names>
</name>
<name>
<surname>Li</surname> <given-names>T</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>H</given-names>
</name>
<name>
<surname>Sheng</surname> <given-names>J</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>X</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X</given-names>
</name>
<etal/>
</person-group>. <article-title>A dynamic nomogram for predicting intraoperative brain bulge during decompressive craniectomy in patients with traumatic brain injury: a retrospective study</article-title>. <source>Int J Surg</source>. (<year>2023</year>) <volume>110</volume>(<issue>2</issue>):<page-range>909&#x2013;20</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/JS9.0000000000001348</pub-id>
</citation>
</ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Riley</surname> <given-names>RD</given-names>
</name>
<name>
<surname>Debray</surname> <given-names>TPA</given-names>
</name>
<name>
<surname>Collins</surname> <given-names>GS</given-names>
</name>
<name>
<surname>Archer</surname> <given-names>L</given-names>
</name>
<name>
<surname>Ensor</surname> <given-names>J</given-names>
</name>
<name>
<surname>van Smeden</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Minimum sample size for external validation of a clinical prediction model with a binary outcome</article-title>. <source>Stat Med</source>. (<year>2021</year>) <volume>40</volume>:<page-range>4230&#x2013;51</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/sim.v40.19</pub-id>
</citation>
</ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>K</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>C</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Ren</surname> <given-names>J</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Interpretable prediction of 3-year all-cause mortality in patients with heart failure caused by coronary heart disease based on machine learning and SHAP</article-title>. <source>Comput Biol Med</source>. (<year>2021</year>) <volume>137</volume>:<fpage>104813</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compbiomed.2021.104813</pub-id>
</citation>
</ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kolde</surname> <given-names>R</given-names>
</name>
<name>
<surname>Laur</surname> <given-names>S</given-names>
</name>
<name>
<surname>Adler</surname> <given-names>P</given-names>
</name>
<name>
<surname>Vilo</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Robust rank aggregation for gene list integration and meta-analysis</article-title>. <source>Bioinformatics</source>. (<year>2012</year>) <volume>28</volume>:<page-range>573&#x2013;80</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btr709</pub-id>
</citation>
</ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lang</surname> <given-names>M</given-names>
</name>
<name>
<surname>Binder</surname> <given-names>M</given-names>
</name>
<name>
<surname>Richter</surname> <given-names>J</given-names>
</name>
<name>
<surname>Schratz</surname> <given-names>P</given-names>
</name>
<name>
<surname>Pfisterer</surname> <given-names>F</given-names>
</name>
<name>
<surname>Coors</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>mlr3: A modern object-oriented machine learning framework in R</article-title>. <source>J Open Source Software</source>. (<year>2019</year>) <volume>4</volume>:<fpage>1903</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.21105/joss.01903</pub-id>
</citation>
</ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>K</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>C</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Ren</surname> <given-names>J</given-names>
</name>
<name>
<surname>Li</surname> <given-names>C</given-names>
</name>
<etal/>
</person-group>. <article-title>Improving risk identification of adverse outcomes in chronic heart failure using SMOTE+ENN and machine learning</article-title>. <source>Risk Manag Healthc Policy</source>. (<year>2021</year>) <volume>14</volume>:<page-range>2453&#x2013;63</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.2147/RMHP.S310295</pub-id>
</citation>
</ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Biecek</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>Dalex: Explainers for complex predictive models in R</article-title>. <source>J Mach Learn Res</source>. (<year>2018</year>) <volume>19</volume>:<page-range>1&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.5555/3291125.3309646</pub-id>
</citation>
</ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lo</surname> <given-names>YT</given-names>
</name>
<name>
<surname>Liao</surname> <given-names>JC</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>MH</given-names>
</name>
<name>
<surname>Chang</surname> <given-names>CM</given-names>
</name>
<name>
<surname>Li</surname> <given-names>CT</given-names>
</name>
</person-group>. <article-title>Predictive modeling for 14-day unplanned hospital readmission risk by using machine learning algorithms</article-title>. <source>BMC Med Inform Decis Mak</source>. (<year>2021</year>) <volume>21</volume>:<fpage>288</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12911-021-01639-y</pub-id>
</citation>
</ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>L</given-names>
</name>
<name>
<surname>Weng</surname> <given-names>S</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>C</given-names>
</name>
<name>
<surname>Dang</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>Machine learning-based integration develops an immune-derived lncRNA signature for improving outcomes in colorectal cancer</article-title>. <source>Nat Commun</source>. (<year>2022</year>) <volume>13</volume>:<fpage>816</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467-022-28421-6</pub-id>
</citation>
</ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sonabend</surname> <given-names>R</given-names>
</name>
<name>
<surname>Kir&#xe1;ly</surname> <given-names>FJ</given-names>
</name>
<name>
<surname>Bender</surname> <given-names>A</given-names>
</name>
<name>
<surname>Bischl</surname> <given-names>B</given-names>
</name>
<name>
<surname>Lang</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>mlr3proba: an R package for machine learning in survival analysis</article-title>. <source>Bioinformatics</source>. (<year>2021</year>) <volume>37</volume>:<page-range>2789&#x2013;91</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btab039</pub-id>
</citation>
</ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rahib</surname> <given-names>L</given-names>
</name>
<name>
<surname>Smith</surname> <given-names>BD</given-names>
</name>
<name>
<surname>Aizenberg</surname> <given-names>R</given-names>
</name>
<name>
<surname>Rosenzweig</surname> <given-names>AB</given-names>
</name>
<name>
<surname>Fleshman</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Matrisian</surname> <given-names>LM</given-names>
</name>
</person-group>. <article-title>Projecting cancer incidence and deaths to 2030: the unexpected burden of thyroid, liver, and pancreas cancers in the United States</article-title>. <source>Cancer Res</source>. (<year>2014</year>) <volume>74</volume>:<page-range>2913&#x2013;21</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1158/0008-5472.CAN-14-0155</pub-id>
</citation>
</ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fatima</surname> <given-names>J</given-names>
</name>
<name>
<surname>Schnelldorfer</surname> <given-names>T</given-names>
</name>
<name>
<surname>Barton</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wood</surname> <given-names>CM</given-names>
</name>
<name>
<surname>Wiste</surname> <given-names>HJ</given-names>
</name>
<name>
<surname>Smyrk</surname> <given-names>TC</given-names>
</name>
<etal/>
</person-group>. <article-title>Pancreatoduodenectomy for ductal adenocarcinoma: implications of positive margin on survival</article-title>. <source>Arch Surg</source>. (<year>2010</year>) <volume>145</volume>:<page-range>167&#x2013;72</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1001/archsurg.2009.282</pub-id>
</citation>
</ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>You</surname> <given-names>K</given-names>
</name>
<name>
<surname>Lei</surname> <given-names>K</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>R</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>A novel nomogram based on the number of positive lymph nodes can predict the overall survival of patients with pancreatic head cancer after radical surgery</article-title>. <source>World J Surg Oncol</source>. (<year>2024</year>) <volume>22</volume>:<fpage>241</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12957-024-03519-x</pub-id>
</citation>
</ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peng</surname> <given-names>W</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>X</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>R</given-names>
</name>
<name>
<surname>Nie</surname> <given-names>S</given-names>
</name>
<name>
<surname>Jian</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zeng</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>Construction and validation of a nomogram for cancer specific survival of postoperative pancreatic cancer based on the SEER and China database</article-title>. <source>BMC Gastroenterol</source>. (<year>2024</year>) <volume>24</volume>:<fpage>104</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12876-024-03180-4</pub-id>
</citation>
</ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>C</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>X</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>S</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>C</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>X</given-names>
</name>
</person-group>. <article-title>Using CatBoost algorithm to&#xa0;identify middle-aged and elderly depression, national health and nutrition examination survey 2011-2018</article-title>. <source>Psychiatry Res</source>. (<year>2021</year>) <volume>306</volume>:<fpage>114261</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.psychres.2021.114261</pub-id>
</citation>
</ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>W</given-names>
</name>
<name>
<surname>Ji</surname> <given-names>L</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Nomogram predicts risk and prognostic factors for bone metastasis of pancreatic cancer: A population-based analysis</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2021</year>) <volume>12</volume>:<elocation-id>752176</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fendo.2021.752176</pub-id>
</citation>
</ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Miao</surname> <given-names>R</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>X</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>C</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z</given-names>
</name>
</person-group>. <article-title>Prognosis and survival analysis of patients with pancreatic cancer: retrospective experience of a single institution</article-title>. <source>World J Surg Oncol</source>. (<year>2022</year>) <volume>20</volume>:<fpage>11</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12957-021-02478-x</pub-id>
</citation>
</ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Garc&#xed;a-Ortiz</surname> <given-names>MV</given-names>
</name>
<name>
<surname>Cano-Ram&#xed;rez</surname> <given-names>P</given-names>
</name>
<name>
<surname>Toledano-Fonseca</surname> <given-names>M</given-names>
</name>
<name>
<surname>Cano</surname> <given-names>MT</given-names>
</name>
<name>
<surname>Inga-Saavedra</surname> <given-names>E</given-names>
</name>
<name>
<surname>Rodr&#xed;guez-Alonso</surname> <given-names>RM</given-names>
</name>
<etal/>
</person-group>. <article-title>Circulating NPTX2 methylation as a non-invasive biomarker for prognosis and monitoring of metastatic pancreatic cancer</article-title>. <source>Clin Epigenet</source>. (<year>2023</year>) <volume>15</volume>:<fpage>118</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13148-023-01535-4</pub-id>
</citation>
</ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hester</surname> <given-names>CA</given-names>
</name>
<name>
<surname>Augustine</surname> <given-names>MM</given-names>
</name>
<name>
<surname>Choti</surname> <given-names>MA</given-names>
</name>
<name>
<surname>Mansour</surname> <given-names>JC</given-names>
</name>
<name>
<surname>Minter</surname> <given-names>RM</given-names>
</name>
<name>
<surname>Polanco</surname> <given-names>PM</given-names>
</name>
<etal/>
</person-group>. <article-title>Comparative outcomes of adenosquamous carcinoma of the pancreas: An analysis of the National Cancer Database</article-title>. <source>J Surg Oncol</source>. (<year>2018</year>) <volume>118</volume>:<fpage>21</fpage>&#x2013;<lpage>30</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/jso.25112</pub-id>
</citation>
</ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Groot</surname> <given-names>VP</given-names>
</name>
<name>
<surname>Rezaee</surname> <given-names>N</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>W</given-names>
</name>
<name>
<surname>Cameron</surname> <given-names>JL</given-names>
</name>
<name>
<surname>Fishman</surname> <given-names>EK</given-names>
</name>
<name>
<surname>Hruban</surname> <given-names>RH</given-names>
</name>
<etal/>
</person-group>. <article-title>Patterns, timing, and predictors of recurrence following pancreatectomy for pancreatic ductal adenocarcinoma</article-title>. <source>Ann Surg</source>. (<year>2018</year>) <volume>267</volume>:<page-range>936&#x2013;45</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/SLA.0000000000002234</pub-id>
</citation>
</ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname> <given-names>G</given-names>
</name>
<name>
<surname>Fan</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Gong</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>K</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>C</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>Characteristics and outcomes of pancreatic cancer by histological subtypes</article-title>. <source>Pancreas</source>. (<year>2019</year>) <volume>48</volume>:<page-range>817&#x2013;22</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/MPA.0000000000001338</pub-id>
</citation>
</ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>X</given-names>
</name>
<name>
<surname>Li</surname> <given-names>M</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Improving the prognosis of pancreatic cancer: insights from epidemiology, genomic alterations, and therapeutic challenges</article-title>. <source>Front Med</source>. (<year>2023</year>) <volume>17</volume>:<page-range>1135&#x2013;69</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11684-023-1050-6</pub-id>
</citation>
</ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pijnappel</surname> <given-names>EN</given-names>
</name>
<name>
<surname>Schuurman</surname> <given-names>M</given-names>
</name>
<name>
<surname>Wagner</surname> <given-names>AD</given-names>
</name>
<name>
<surname>de Vos-Geelen</surname> <given-names>J</given-names>
</name>
<name>
<surname>van der Geest</surname> <given-names>LGM</given-names>
</name>
<name>
<surname>de Groot</surname> <given-names>JB</given-names>
</name>
<etal/>
</person-group>. <article-title>Sex, gender and age differences in treatment allocation and survival of patients with metastatic pancreatic cancer: A nationwide study</article-title>. <source>Front Oncol</source>. (<year>2022</year>) <volume>12</volume>:<elocation-id>839779</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fonc.2022.839779</pub-id>
</citation>
</ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>J</given-names>
</name>
<name>
<surname>Ji</surname> <given-names>E</given-names>
</name>
<name>
<surname>Jung</surname> <given-names>K</given-names>
</name>
<name>
<surname>Jung</surname> <given-names>IH</given-names>
</name>
<name>
<surname>Park</surname> <given-names>J</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>JC</given-names>
</name>
<etal/>
</person-group>. <article-title>Gender differences in patients with metastatic pancreatic cancer who received FOLFIRINOX</article-title>. <source>J Pers Med</source>. (<year>2021</year>) <volume>11</volume>(<issue>2</issue>):<fpage>83</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/jpm11020083</pub-id>
</citation>
</ref>
<ref id="B35">
<label>35</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Us&#xf3;n</surname> <given-names>PLS</given-names> <suffix>Jr</suffix>
</name>
<name>
<surname>Tolentino</surname> <given-names>FDS</given-names>
</name>
<name>
<surname>Santos</surname> <given-names>VM</given-names>
</name>
<name>
<surname>Rother</surname> <given-names>ET</given-names>
</name>
<name>
<surname>Maluf</surname> <given-names>FC</given-names>
</name>
</person-group>. <article-title>The impact of metastatic sites in advanced pancreatic adenocarcinoma, systematic review and meta-analysis of prospective randomized studies</article-title>. <source>PLoS One</source>. (<year>2020</year>) <volume>15</volume>:<elocation-id>e0230060</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0230060</pub-id>
</citation>
</ref>
<ref id="B36">
<label>36</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>He</surname> <given-names>C</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>X</given-names>
</name>
<name>
<surname>Li</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>The impact of different metastatic patterns on survival in patients with pancreatic cancer</article-title>. <source>Pancreatology</source>. (<year>2021</year>) <volume>21</volume>:<page-range>556&#x2013;63</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.pan.2021.01.014</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>