<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Oncol.</journal-id>
<journal-title>Frontiers in Oncology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Oncol.</abbrev-journal-title>
<issn pub-type="epub">2234-943X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fonc.2023.1105224</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Oncology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Individual risk and prognostic value prediction by machine learning for distant metastasis in pulmonary sarcomatoid carcinoma: a large cohort study based on the SEER database and the Chinese population</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Yi</surname>
<given-names>Xinglin</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1910088"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Xu</surname>
<given-names>Wenhao</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tang</surname>
<given-names>Guihua</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Lingye</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Kaishan</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2228102"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Luo</surname>
<given-names>Hu</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/890284"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zhou</surname>
<given-names>Xiangdong</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Respiratory Medicine, Southwest Hospital of Third Military Medical University</institution>, <addr-line>Chongqing</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Urinary Medicine Center, Southwest Hospital of Third Military Medical University</institution>, <addr-line>Chongqing</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Neurosurgery, Southwest Hospital of Third Military Medical University</institution>, <addr-line>Chongqing</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Chuanming Li, Chongqing University Central Hospital, China</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Kathiravan Srinivasan, Vellore Institute of Technology, Vellore, India; Yinlong Yuan, Nantong University, China</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Hu Luo, <email xlink:href="mailto:luohucy@163.com">luohucy@163.com</email>;  Xiangdong Zhou, <email xlink:href="mailto:xiangdongzhou@126.com">xiangdongzhou@126.com</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>26</day>
<month>06</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>13</volume>
<elocation-id>1105224</elocation-id>
<history>
<date date-type="received">
<day>22</day>
<month>11</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>06</day>
<month>06</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Yi, Xu, Tang, Zhang, Wang, Luo and Zhou</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Yi, Xu, Tang, Zhang, Wang, Luo and Zhou</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>This study aimed to develop diagnostic and prognostic models for patients with pulmonary sarcomatoid carcinoma (PSC) and distant metastasis (DM).</p>
</sec>
<sec>
<title>Methods</title>
<p>Patients from the Surveillance, Epidemiology, and End Results (SEER) database were divided into a training set and internal test set at a ratio of 7 to 3, while those from the Chinese hospital were assigned to the external test set, to develop the diagnostic model for DM. Univariate logistic regression was employed in the training set to screen for DM-related risk factors, which were included in six machine learning (ML) models. Furthermore, patients from the SEER database were randomly divided into a training set and validation set at a ratio of 7 to 3 to develop the prognostic model, which predicts the survival of PSC patients with DM. Univariate and multivariate Cox regression analyses were also performed in the training set to identify independent factors, and a prognostic nomogram for cancer-specific survival (CSS) was constructed for PSC patients with DM.</p>
</sec>
<sec>
<title>Results</title>
<p>For the diagnostic model for DM, 589 patients with PSC in the training set, 255 patients in the internal test set, and 94 patients in the external test set were eventually enrolled. The extreme gradient boosting (XGB) algorithm performed best on the external test set with an area under the curve (AUC) of 0.821. For the prognostic model, 270 PSC patients with DM in the training set and 117 patients in the test set were enrolled. The nomogram displayed high accuracy, with AUCs of 0.803 for 3-month CSS and 0.869 for 6-month CSS in the test set.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>The ML model accurately identified individuals at high risk for DM who needed more careful follow-up, including appropriate preventative therapeutic strategies. The prognostic nomogram accurately predicted CSS in PSC patients with DM.</p>
</sec>
</abstract>
<kwd-group>
<kwd>machine learning</kwd>
<kwd>SEER</kwd>
<kwd>Pulmonary sarcomatoid carcinoma</kwd>
<kwd>risk</kwd>
<kwd>prognosis</kwd>
</kwd-group>
<contract-num rid="cn001">2020FYYX012</contract-num>
<contract-sponsor id="cn001">Science-Health Joint Medical Scientific Research Project of Chongqing<named-content content-type="fundref-id">10.13039/100017501</named-content>
</contract-sponsor>
<counts>
<fig-count count="6"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="32"/>
<page-count count="10"/>
<word-count count="4335"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Cancer Epidemiology and Prevention</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Pulmonary sarcomatoid carcinoma (PSC) is rare among all lung malignancies, with an incidence of 0.1&#x2013;0.5% (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B2">2</xref>). According to the World Health Organization classification guidelines in 2021, PSC consists of giant cell carcinoma, pleomorphic carcinoma, spindle cell carcinoma, pulmonary blastoma, and carcinosarcoma (<xref ref-type="bibr" rid="B3">3</xref>). Clinically, newly diagnosed patients with PSCs are more likely to be male (77%), smokers (84%), and of advanced age, with a median age of 68 years at diagnosis (<xref ref-type="bibr" rid="B4">4</xref>). Similar to other subtypes of non-small cell lung carcinoma (NSCLC), the initial symptoms of PSC include cough, chest pain, weight loss, and dyspnea (<xref ref-type="bibr" rid="B5">5</xref>).</p>
<p>PSC is a highly aggressive malignancy. Recent studies have reported that the 5-year survival rate ranges from approximately 15% to 20% (<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B7">7</xref>), which is considerably lower than that in other subtypes of NSCLC. Targeted drugs, especially those focusing on mesenchymal-epithelial transition (MET) exon 14 skipping mutations, have been shown to be beneficial in improving the median survival time to 10 months (<xref ref-type="bibr" rid="B8">8</xref>). However, distant metastasis (DM) still results in most patients having a shorter survival time (<xref ref-type="bibr" rid="B9">9</xref>&#x2013;<xref ref-type="bibr" rid="B11">11</xref>). Owing to the rapid invasion into vasculature, 40&#x2013;60% of PSC patients are diagnosed with DM at first presentation (<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B12">12</xref>). The most common sites of DM are bone (16%), lungs (15%), brain (12%), and liver (8%), while 62% of patients present with multiple DM sites (<xref ref-type="bibr" rid="B13">13</xref>). The 1- and 3-year overall survival (OS) probabilities of PSC patients with DM are reported to be only 14.1% and 5.5%, respectively, which are significantly lower than those of patients without DM (58.2% and 38.1%, respectively) (<xref ref-type="bibr" rid="B13">13</xref>). Therefore, it is of great clinical significance to identify those at risk of developing DM at the initial stage of diagnosis.</p>
<p>Computed tomography (CT), magnetic resonance imaging (MRI), and positron emission tomography-computed tomography (PET-CT) are commonly used diagnostic modalities for screening for DM in newly hospitalized patients with PSC. However, these screening methods are difficult to apply to all hospitalized PSC patients due to their high cost, including time-related costs. Meanwhile, due to its rare incidence, the prognostic factors of PSC patients with DM remain unclear. Consequently, research investigating the factors influencing survival is important as it can inform and guide clinical strategies. Since the emergence of big data analysis and machine learning (ML), it is possible to provide an alternative option for factor screening. Several predictive models with outstanding performance have been built for application in clinical practice using big data and ML (<xref ref-type="bibr" rid="B14">14</xref>&#x2013;<xref ref-type="bibr" rid="B16">16</xref>). The Surveillance, Epidemiology, and End Results (SEER) database (<ext-link ext-link-type="uri" xlink:href="https://seer.cancer.gov/">https://seer.cancer.gov/</ext-link>) covers geographically diverse patients with detailed information on the patients&#x2019; clinicopathological statistics and follow-up visits, providing an abundance of medical cases to analyze. This real-world-based database offers a golden opportunity to develop or examine ML models in this field. However, to our knowledge, no studies have focused on establishing models for the prediction and prognosis of DM in PSC patients.</p>
<p>Therefore, this study aimed to establish and validate diagnostic and prognostic models based on ML algorithms and Cox regression using a large population cohort. Additionally, this study aimed to offer personalized predictors that could serve as effective tools for clinicians to preliminarily evaluate the risk and prognosis of PSC with DM, saving patients from unnecessary costs.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Data source and characteristics</title>
<p>Clinicopathological information of patients with PSC diagnosed between 2004 and 2018 was collected from the SEER database. Additionally, clinicopathological data from Southwest Hospital (2004&#x2013;2022) in China was retrospectively obtained using an electronic medical record system. Inclusion criteria comprised the primary disease site and morphology, based on the 6th Edition of the American Joint Committee on Cancer (AJCC) &#x201c;Lung,&#x201d; with the following International Classification of Diseases for Oncology 3rd Edition (ICD-O-3) codes: 8022/3, 8031/3, 8032/3, 8972/3, or 8980/3. Exclusion criteria comprised patients whose information on laterality, primary site, tumor-node-metastasis (TNM) stage, histology, marital status, and tumor size was unknown; patients with more than one primary malignancy; patients aged &lt;18 years; and patients whose survival time and therapeutic information were unknown. In addition, patients with unknown survival months were excluded from the survival analysis. Finally, a total of 844 patients from the SEER database and 94 patients from Southwest Hospital in China were included in the analysis. For the diagnostic model for DM, 844 patients in the SEER cohort were divided randomly into training and internal test sets in a 7:3 ratio with 589 and 255 cases, respectively. The 94 patients from the Southwest Hospital cohort were assigned to the external test set. For the prognostic model for cancer-specific survival (CSS) of PSC patients with DM, we randomly assigned PSC patients with DM into training and test sets in a 7:3 ratio. As a result, 270 PSC patients with DM were included in the training set, and 117 were included in the test set. External validation of the prognostic model was not performed for two reasons: first, considerable prognostic information about the PSC patients with DM was censored in our hospital; second, the sample size was too small to satisfy the minimal sample size needed for analysis.</p>
<p>Clinicopathological factors included age, sex, histology, ethnicity, TNM stage, laterality, primary site, marital status, survival time, surgery, chemotherapy, and radiation therapy. Primary T and M staging was adjusted based on tumor size and extension according to the AJCC 8th Edition TNM staging system. Due to the sample limitations, ethnicity was categorized into &#x2018;European&#x2019; and &#x2018;other&#x2019; groups and marital status into &#x2018;married&#x2019; and &#x2018;other&#x2019; groups.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Statistical analysis</title>
<p>The overall statistical analysis was performed using R software (version 4.2.1). Chi-square tests were used to discern differences in categorical variables, and t-tests were used to compare discrepancies between the continuous variables. All variables were included in the correlation analysis using the Spearman method, which was performed to determine which variables were significant and to exclude confounding variables.</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Development and evaluation of ML-based diagnostic models for DM</title>
<p>In the preliminary analysis, variables with P &lt; 0.05 in the univariate logistic analysis in the training set were included in the model construction process, which involved the logistic regression (LR), random forest (RF), support vector machine (SVM), extreme gradient boosting (XGB), decision tree (DT), and artificial neural network (ANN) models. The hyperparameters were tuned using 10-fold cross-validation and a grid search procedure to improve the predictive performance and enhance the stability of the ML models. The &#x201c;tidymodels&#x201d; package in R software completed all these development procedures.</p>
<p>Model performance was comprehensively evaluated using the area under the curve (AUC), sensitivity, specificity, and accuracy. In addition, we performed calibration curve and decision curve analysis (DCA) to check the discriminative ability and practical clinical value. The best-performing model was then used to build a web-based calculator to allow access to the model.</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Establishment and validation of the prognostic nomogram</title>
<p>In the training cohort, a univariate Cox model was used to identify CSS-related independent factors for PSC patients with DM. Variables with P &lt; 0.05 were included in a multivariate Cox analysis. The variables with P &lt; 0.05 in the multivariate Cox regression were incorporated into the prognostic nomogram development to estimate survival probability at 3 and 6 months. The AUC, calibration, and DCA estimators were used to evaluate the nomogram.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Baseline characteristics and correlation analysis</title>
<p>A total of 589 patients with PSC were included in the training set, while 255 PSC patients were included in the internal test set. Of these, 270 patients in the training set and 117 patients in the internal test set presented with DM. In addition, 94 patients whose clinical information was recorded from the Southwest Hospital were assigned to an external test set, among whom 37 patients suffered from DM. The detailed characteristics and discrepancies between the DM and non-DM groups are presented in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>. Patients with DM were observed to be more likely male with advanced T and N stages. In addition, the histology of codes 8031 and 8032, namely giant cell carcinoma and spindle cell carcinoma, respectively, were found to be correlated with a higher proportion of DM. Spearman&#x2019;s correlation analysis suggested that T-stage, N-stage, radiation therapy, and histology were positively correlated with DM, whereas surgery and survival months were negatively correlated. In terms of survival, surgery and chemotherapy were observed to positively influence survival time. In contrast, older age, T stage, N stage, and M stage negatively contributed to survival (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>).</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Baseline characteristics.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Variables</th>
<th valign="bottom" colspan="2" align="center">Train set</th>
<th valign="bottom" colspan="3" align="center">Internal test set</th>
<th valign="bottom" colspan="2" align="center">External test set</th>
</tr>
<tr>
<th valign="middle" align="center">
</th>
<th valign="middle" align="center">Non-DM<break/>(N = 319)</th>
<th valign="middle" align="center">DM<break/>(N = 270)</th>
<th valign="middle" align="center">Non-DM<break/>(N = 138)</th>
<th valign="middle" align="center" colspan="2">DM<break/>(N = 117)</th>
<th valign="middle" align="center">Non-DM<break/>(N = 57)</th>
<th valign="middle" align="center">DM<break/>(N = 37)</th>
</tr>
</thead>
<tbody>
<tr>
<th valign="middle" colspan="8" align="center">T stage</th>
</tr>
<tr>
<td valign="middle" align="center">T1</td>
<td valign="middle" align="center">45 (14.1%)</td>
<td valign="middle" align="center">14 (5.2%)</td>
<td valign="middle" align="center">30 (21.7%)</td>
<td valign="middle" colspan="2" align="center">8 (6.8%)</td>
<td valign="middle" align="center">16 (28.1%)</td>
<td valign="middle" align="center">3 (8.1%)</td>
</tr>
<tr>
<td valign="middle" align="center">T2</td>
<td valign="middle" align="center">95 (29.8%)</td>
<td valign="middle" align="center">45 (16.7%)</td>
<td valign="middle" align="center">37 (26.8%)</td>
<td valign="middle" colspan="2" align="center">22 (18.8%)</td>
<td valign="middle" align="center">22 (38.6%)</td>
<td valign="middle" align="center">14 (37.8%)</td>
</tr>
<tr>
<td valign="middle" align="center">T3</td>
<td valign="middle" align="center">86 (27.0%)</td>
<td valign="middle" align="center">69 (25.6%)</td>
<td valign="middle" align="center">31 (22.5%)</td>
<td valign="middle" colspan="2" align="center">26 (22.2%)</td>
<td valign="middle" align="center">9 (15.8%)</td>
<td valign="middle" align="center">11 (29.7%)</td>
</tr>
<tr>
<td valign="middle" align="center">T4</td>
<td valign="middle" align="center">93 (29.2%)</td>
<td valign="middle" align="center">142 (52.6%)</td>
<td valign="middle" align="center">40 (29.0%)</td>
<td valign="middle" colspan="2" align="center">61 (52.1%)</td>
<td valign="middle" align="center">10 (17.5%)</td>
<td valign="middle" align="center">9 (24.3%)</td>
</tr>
<tr>
<th valign="middle" colspan="8" align="center">N stage</th>
</tr>
<tr>
<td valign="middle" align="center">N0</td>
<td valign="middle" align="center">202 (63.3%)</td>
<td valign="middle" align="center">86 (31.9%)</td>
<td valign="middle" align="center">83 (60.1%)</td>
<td valign="middle" colspan="2" align="center">41 (35.0%)</td>
<td valign="middle" align="center">40 (70.2%)</td>
<td valign="middle" align="center">9 (24.3%)</td>
</tr>
<tr>
<td valign="middle" align="center">N1</td>
<td valign="middle" align="center">42 (13.2%)</td>
<td valign="middle" align="center">31 (11.5%)</td>
<td valign="middle" align="center">22 (15.9%)</td>
<td valign="middle" colspan="2" align="center">14 (12.0%)</td>
<td valign="middle" align="center">7 (12.3%)</td>
<td valign="middle" align="center">1 (2.7%)</td>
</tr>
<tr>
<td valign="middle" align="center">N2</td>
<td valign="middle" align="center">67 (21.0%)</td>
<td valign="middle" align="center">109 (40.4%)</td>
<td valign="middle" align="center">31 (22.5%)</td>
<td valign="middle" colspan="2" align="center">43 (36.8%)</td>
<td valign="middle" align="center">10 (17.5%)</td>
<td valign="middle" align="center">14 (37.8%)</td>
</tr>
<tr>
<td valign="middle" align="center">N3</td>
<td valign="middle" align="center">8 (2.5%)</td>
<td valign="middle" align="center">44 (16.3%)</td>
<td valign="middle" align="center">2 (1.4%)</td>
<td valign="middle" colspan="2" align="center">19 (16.2%)</td>
<td valign="middle" align="center">0 (0%)</td>
<td valign="middle" align="center">13 (35.1%)</td>
</tr>
<tr>
<th valign="middle" colspan="8" align="center">Histology</th>
</tr>
<tr>
<td valign="middle" align="center">8022</td>
<td valign="middle" align="center">155 (48.6%)</td>
<td valign="middle" align="center">75 (27.8%)</td>
<td valign="middle" align="center">81 (58.7%)</td>
<td valign="middle" colspan="2" align="center">25 (21.4%)</td>
<td valign="middle" align="center">14 (24.6%)</td>
<td valign="middle" align="center">4 (10.8%)</td>
</tr>
<tr>
<td valign="middle" align="center">8031</td>
<td valign="middle" align="center">57 (17.9%)</td>
<td valign="middle" align="center">96 (35.6%)</td>
<td valign="middle" align="center">24 (17.4%)</td>
<td valign="middle" colspan="2" align="center">39 (33.3%)</td>
<td valign="middle" align="center">9 (15.8%)</td>
<td valign="middle" align="center">9 (24.3%)</td>
</tr>
<tr>
<td valign="middle" align="center">8032</td>
<td valign="middle" align="center">90 (28.2%)</td>
<td valign="middle" align="center">95 (35.2%)</td>
<td valign="middle" align="center">29 (21.0%)</td>
<td valign="middle" colspan="2" align="center">50 (42.7%)</td>
<td valign="middle" align="center">20 (35.1%)</td>
<td valign="middle" align="center">15 (40.5%)</td>
</tr>
<tr>
<td valign="middle" align="center">8972</td>
<td valign="middle" align="center">1 (0.3%)</td>
<td valign="middle" align="center">0 (0%)</td>
<td valign="middle" align="center">1 (0.7%)</td>
<td valign="middle" colspan="2" align="center">0 (0%)</td>
<td valign="middle" align="center">5 (8.8%)</td>
<td valign="middle" align="center">4 (10.8%)</td>
</tr>
<tr>
<td valign="middle" align="center">8980</td>
<td valign="middle" align="center">16 (5.0%)</td>
<td valign="middle" align="center">4 (1.5%)</td>
<td valign="middle" align="center">3 (2.2%)</td>
<td valign="middle" colspan="2" align="center">3 (2.6%)</td>
<td valign="middle" align="center">9 (15.8%)</td>
<td valign="middle" align="center">5 (13.5%)</td>
</tr>
<tr>
<th valign="middle" colspan="8" align="center">Sex</th>
</tr>
<tr>
<td valign="middle" align="center">Female</td>
<td valign="middle" align="center">135 (42.3%)</td>
<td valign="middle" align="center">101 (37.4%)</td>
<td valign="middle" align="center">60 (43.5%)</td>
<td valign="middle" colspan="2" align="center">44 (37.6%)</td>
<td valign="middle" align="center">9 (15.8%)</td>
<td valign="middle" align="center">9 (24.3%)</td>
</tr>
<tr>
<td valign="middle" align="center">Male</td>
<td valign="middle" align="center">184 (57.7%)</td>
<td valign="middle" align="center">169 (62.6%)</td>
<td valign="middle" align="center">78 (56.5%)</td>
<td valign="middle" colspan="2" align="center">73 (62.4%)</td>
<td valign="middle" align="center">48 (84.2%)</td>
<td valign="middle" align="center">28 (75.7%)</td>
</tr>
<tr>
<th valign="middle" colspan="8" align="center">Laterality</th>
</tr>
<tr>
<td valign="middle" align="center">Left</td>
<td valign="middle" align="center">136 (42.6%)</td>
<td valign="middle" align="center">116 (43.0%)</td>
<td valign="middle" align="center">54 (39.1%)</td>
<td valign="middle" colspan="2" align="center">57 (48.7%)</td>
<td valign="middle" align="center">31 (54.4%)</td>
<td valign="middle" align="center">14 (37.8%)</td>
</tr>
<tr>
<td valign="middle" align="center">Right</td>
<td valign="middle" align="center">183 (57.4%)</td>
<td valign="middle" align="center">154 (57.0%)</td>
<td valign="middle" align="center">84 (60.9%)</td>
<td valign="middle" colspan="2" align="center">60 (51.3%)</td>
<td valign="middle" align="center">26 (45.6%)</td>
<td valign="middle" align="center">23 (62.2%)</td>
</tr>
<tr>
<th valign="middle" colspan="8" align="center">Primary site</th>
</tr>
<tr>
<td valign="middle" align="center">Lower</td>
<td valign="middle" align="center">95 (29.8%)</td>
<td valign="middle" align="center">81 (30.0%)</td>
<td valign="middle" align="center">29 (21.0%)</td>
<td valign="middle" colspan="2" align="center">40 (34.2%)</td>
<td valign="middle" align="center">18 (31.6%)</td>
<td valign="middle" align="center">14 (37.8%)</td>
</tr>
<tr>
<td valign="middle" align="center">Middle</td>
<td valign="middle" align="center">14 (4.4%)</td>
<td valign="middle" align="center">18 (6.7%)</td>
<td valign="middle" align="center">10 (7.2%)</td>
<td valign="middle" colspan="2" align="center">5 (4.3%)</td>
<td valign="middle" align="center">1 (1.8%)</td>
<td valign="middle" align="center">1 (2.7%)</td>
</tr>
<tr>
<td valign="middle" align="center">Other</td>
<td valign="middle" align="center">20 (6.3%)</td>
<td valign="middle" align="center">15 (5.6%)</td>
<td valign="middle" align="center">4 (2.9%)</td>
<td valign="middle" colspan="2" align="center">7 (6.0%)</td>
<td valign="middle" align="center">/</td>
<td valign="middle" align="center">/</td>
</tr>
<tr>
<td valign="middle" align="center">Upper</td>
<td valign="middle" align="center">190 (59.6%)</td>
<td valign="middle" align="center">156 (57.8%)</td>
<td valign="middle" align="center">95 (68.8%)</td>
<td valign="middle" colspan="2" align="center">65 (55.6%)</td>
<td valign="middle" align="center">38 (66.7%)</td>
<td valign="middle" align="center">22 (59.5%)</td>
</tr>
<tr>
<th valign="middle" colspan="8" align="center">Ethnicity</th>
</tr>
<tr>
<td valign="middle" align="center">Other</td>
<td valign="middle" align="center">23 (7.2%)</td>
<td valign="middle" align="center">23 (8.5%)</td>
<td valign="middle" align="center">12 (8.7%)</td>
<td valign="middle" colspan="2" align="center">9 (7.7%)</td>
<td valign="middle" align="center">57 (100%)</td>
<td valign="middle" align="center">37 (100%)</td>
</tr>
<tr>
<td valign="middle" align="center">European</td>
<td valign="middle" align="center">296 (92.8%)</td>
<td valign="middle" align="center">247 (91.5%)</td>
<td valign="middle" align="center">126 (91.3%)</td>
<td valign="middle" colspan="2" align="center">108 (92.3%)</td>
<td valign="middle" align="center">/</td>
<td valign="middle" align="center">/</td>
</tr>
<tr>
<th valign="middle" colspan="8" align="center">Age</th>
</tr>
<tr>
<td valign="middle" align="center">Mean (SD)</td>
<td valign="middle" align="center">67.4 (11.5)</td>
<td valign="middle" align="center">67.4 (11.4)</td>
<td valign="middle" align="center">66.7 (10.6)</td>
<td valign="middle" colspan="2" align="center">64.5 (12.0)</td>
<td valign="middle" align="center">63.2 (11.8)</td>
<td valign="middle" align="center">65.4 (11.0)</td>
</tr>
<tr>
<th valign="middle" colspan="8" align="center">Marital status</th>
</tr>
<tr>
<td valign="middle" align="center">Married</td>
<td valign="middle" align="center">174 (54.5%)</td>
<td valign="middle" align="center">138 (51.1%)</td>
<td valign="middle" align="center">71 (51.4%)</td>
<td valign="middle" colspan="2" align="center">64 (54.7%)</td>
<td valign="middle" align="center">56 (98.2%)</td>
<td valign="middle" align="center">37 (100%)</td>
</tr>
<tr>
<td valign="middle" align="center">Other</td>
<td valign="middle" align="center">145 (45.5%)</td>
<td valign="middle" align="center">132 (48.9%)</td>
<td valign="middle" align="center">67 (48.6%)</td>
<td valign="middle" colspan="2" align="center">53 (45.3%)</td>
<td valign="middle" align="center">1 (1.8%)</td>
<td valign="middle" align="center">0 (0%)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>DM, distant metastasis; SD, standard deviation.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>The heatmap of Spearman&#x2019;s correlation analysis of the baseline characteristics. The correlation index ranges from -1.0 to 1.0, with a brighter color indicating a stronger correlation.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1105224-g001.tif"/>
</fig>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Establishment and performance of diagnostic ML models for DM</title>
<p>The univariate logistic regression analysis (<xref ref-type="supplementary-material" rid="SF1">
<bold>Supplementary Figure&#xa0;1</bold>
</xref>) showed that T-stage, N-stage, and histology were variables with P-values &lt; 0.05 and were therefore included in the ML models. In addition, the multivariate analysis (<xref ref-type="supplementary-material" rid="SF2">
<bold>Supplementary Figure&#xa0;2</bold>
</xref>) showed that the N3 stage, T4 stage, N2 stage, histology of 8031, T3 stage, and histology of 8032 (arranged from high to low according to odds ratios [ORs]) were identified as significant factors contributing to DM. Six ML algorithms were established by incorporating the above selection of variables, comprising logistic regression (LR), extreme gradient boosting (XGB), random forest (RF), support vector machine (SVM), decision tree (DT), and artificial neural network (ANN) algorithms. Hyperparameters were fine-tuned by performing 10-fold cross-validation and grid searches. Finally, LR, ANN, and XGB were found to have the highest AUC in the internal test set (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>), while the XGB algorithm outperformed the others, with the highest AUC of 0.821 in the external test set. The optimal hyperparameter values were eta, 0.007; max_depth, 1L; gamma, 0.011; colsample_bytree, 1; colsample_bynode, 0.231; min_child_weight, 8L; and subsample, 0.997.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>The performance of six ML models in terms of AUC, accuracy, sensitivity, and specificity. ANN, artificial neural network; AUC, area under the curve; DT, decision tree; LR, logistic regression; ML, machine learning; RF, random forest; SVM, support vector machine; XGB, extreme gradient boosting.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1105224-g002.tif"/>
</fig>
<p>As illustrated in <xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3A&#x2013;C</bold>
</xref>, the AUC differed slightly in the training set and the internal test set among the six ML algorithms; however, in the external test set, XGB performed the best. Calibration plots (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3D&#x2013;F</bold>
</xref>) showed that ML algorithms had a good fitting ability, except for the ANN model, which meant that the ML algorithms accurately predicted the outcome. DCA curves (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3G&#x2013;I</bold>
</xref>) suggested that ML algorithms had a high clinical application value and could effectively help diagnose DM.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>The clinical applicative performance of six ML models. Receiver operating characteristic curves of six ML models in the training set <bold>(A)</bold>, the internal test set <bold>(B)</bold>, and the external test set <bold>(C)</bold>. Calibration curves of six ML models in the training set <bold>(D)</bold>, the internal test set <bold>(E)</bold> and the external test set <bold>(F)</bold>. Decision curve analysis of six ML models in the training set <bold>(G)</bold>, the internal test set <bold>(H)</bold>, and the external test set <bold>(I)</bold>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1105224-g003.tif"/>
</fig>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Web-based predictor publication</title>
<p>An online calculator based on the XGB model was successfully built (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>), as this model performed the best among all the models. This web-based tool can be readily accessed at <ext-link ext-link-type="uri" xlink:href="https://onepiece.shinyapps.io/PSCdistant/">https://onepiece.shinyapps.io/PSCdistant/</ext-link>. This tool encompassed three simple clinical variables and could help clinicians accurately and conveniently identify those at risk for DM among patients with PSC.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Web-based calculator online for free, based on the XGB model. XGB, extreme gradient boosting.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1105224-g004.tif"/>
</fig>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Prognostic nomogram establishment and performance</title>
<p>In the prognostic analysis, 270 PSC patients with DM in the training set and 117 patients in the test set were enrolled. As shown in <xref ref-type="supplementary-material" rid="SF3">
<bold>Supplementary Figure&#xa0;3</bold>
</xref>, the univariate Cox regression analysis indicated that the T4 stage (P = 0.013), N2 stage (P = 0.048), N3 stage (P = 0.001), upper site (P = 0.023), surgery (P = 0.013), chemotherapy (P &lt; 0.001), and radiation therapy (P &lt; 0.001) were significantly associated with prognosis in PSC patients with DM. After performing multivariate Cox analysis (<xref ref-type="supplementary-material" rid="SF4">
<bold>Supplementary Figure&#xa0;4</bold>
</xref>), stage T4 (P = 0.005), T3 (P = 0.034), N3 (P = 0.002), N2 (P = 0.005), and upper site (P = 0.01) were found to be independent adverse prognostic factors, whereas radiation therapy (P = 0.004), surgery (P = 0.004), and chemotherapy (P &lt; 0.001) were protective prognostic factors for PSC patients with DM. We developed a prognostic nomogram based on these independent variables, to predict the CSS-related survival probability at 3 and 6 months (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>). The CSS-related AUC values at 3 and 6 months were 0.810 and 0.822 in the training set (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6A</bold>
</xref>) and 0.803 and 0.869 in the test set (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6B</bold>
</xref>), respectively, suggesting high predictive accuracy. In addition, calibration (<xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6C&#x2013;F</bold>
</xref>) and DCA curves (<xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6G, H</bold>
</xref>) showed the prognostic nomogram&#x2019;s good fitting ability and clinical application.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>A prognostic nomogram to evaluate 3- and 6-month CSS-related survival probabilities for PSC patients with DM. Note: Drawing a vertical line from each line of the parameters to the &#x201c;points&#x201d; axis can be used to acquire the points for each variable. Then, the total score can be obtained by adding all the points for each independent variable. Finally, by drawing a vertical line from the &#x201c;total score&#x201d; axis to the survival probability line, the individual survival probability at 3 and 6 months can be calculated, and the risk level can be obtained. DM, distant metastases; PSC, pulmonary sarcomatoid carcinoma. *P&lt;0.05; **P&lt;0.01; ***P&lt;0.001.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1105224-g005.tif"/>
</fig>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Clinical applicative performance of the prognostic nomogram. Receiver operating characteristic curves at 3 and 6 months in training <bold>(A)</bold> and test sets <bold>(B)</bold>. Calibration plots at 3 months <bold>(C)</bold> and 6 months <bold>(D)</bold> in the training set. Calibration plots at 3 months <bold>(E)</bold> and 6 months <bold>(F)</bold> in the test set. Decision curve analysis at 3 and 6 months in the training <bold>(G)</bold> and test sets <bold>(H)</bold>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1105224-g006.tif"/>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>PSC is a rare lung malignancy with a high probability of DM. Several studies have reported that DM is an independent risk factor for PSC (<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B17">17</xref>, <xref ref-type="bibr" rid="B18">18</xref>). In this study, approximately 45.2% of patients had DM at initial presentation, similar to that reported by Zombori-T&#xf3;th and Terra (<xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B20">20</xref>). The high rate of DM may be attributed to its capacity to invade the vasculature and the high likelihood of DM recurrence. Lococo et&#xa0;al. analyzed the pathological results of 143 patients and found high incidences of lymphatic (30%) and vascular emboli (68%) (<xref ref-type="bibr" rid="B21">21</xref>). Liang et&#xa0;al. found that MET mutations were commonly expressed in PSCs with a high rate of 16% (<xref ref-type="bibr" rid="B22">22</xref>), whereas the incidence of KRAS mutations was 22%. Similarly, Liu et&#xa0;al. identified eight out of 36 (22%) patients harboring MET mutations (<xref ref-type="bibr" rid="B23">23</xref>). This incidence was considerably higher than that in other NSCLC subtypes (3%) (<xref ref-type="bibr" rid="B24">24</xref>). A study on 77 Chinese patients with PSC indicated that the rate of positive METex14 skipping mutations was 20.8%, leading to worse disease-free survival (DFS) (<xref ref-type="bibr" rid="B25">25</xref>). In recent years, immune checkpoint inhibitors (ICIs) and targeted drugs for MET exon 14 skipping mutations have exhibited satisfying benefits in improving patient survival (<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B27">27</xref>). However, patients who developed DM still had a significantly worse prognosis. Thus, early attention to DM is important to improve prognosis and help clinicians make the optimal targeted therapeutic decision.</p>
<p>CT, MRI, and PET-CT are conventional radiological screening methods for patients with NSCLC. However, performing all these radiological examinations is costly for newly diagnosed patients. In addition, time-consuming screening processes and potential side effects can delay the patients&#x2019; course from diagnosis to therapy. Therefore, there is an urgent need for a noninvasive, precise, and rapid method to assist in identifying potential DM at the initial hospitalization stage and to estimate the prognosis for PSC patients with DM. In this study, six ML algorithms for predicting DM in patients with PSC and a nomogram for evaluating the prognosis for those with DM were developed. An automatic calculator based on the best-performing algorithm was created and published online for public access. Moreover, the prognostic nomogram could accurately identify risk factors in PSC patients with DM and help clinicians evaluate survival.</p>
<p>Few studies have identified the risk factors for DM in patients with PSC due to its rarity. Our logistic regression analysis showed that histologic subtype, T stage, and N stage were independent risk factors for DM in patients with PSC. Among these factors, the N3 stage was most correlated with DM. Patients with the N3 stage had the highest OR of 9.72 (P &lt; 0.001), followed by the T4 stage (OR 4.30, P &lt; 0.001), N2 stage (OR 3.09, P&#xa0;&lt; 0.001), giant cell carcinoma (OR 2.56, P &lt; 0.001), T3 stage (OR 2.36, P = 0.022), and spindle cell carcinoma (OR 2.12, P &lt; 0.001). These findings were similar to those reported by Xiao et&#xa0;al., who retrospectively analyzed 934 PSC patients using the SEER program database and reported that spindle cell carcinoma (OR 3.151, P &lt; 0.001) and giant cell carcinoma (OR 4.023, P &lt; 0.001) were independent risk factors for DM (<xref ref-type="bibr" rid="B13">13</xref>).</p>
<p>Similarly, T-stage and N-stage have been reported as risk factors for DM in lung adenocarcinoma and squamous cell carcinoma (<xref ref-type="bibr" rid="B28">28</xref>, <xref ref-type="bibr" rid="B29">29</xref>). The two variables have also been identified as important factors for the development of DM in patients with PSC (<xref ref-type="bibr" rid="B28">28</xref>, <xref ref-type="bibr" rid="B29">29</xref>). These three clinical features were then incorporated into the building procedures of the six ML models. The XGB model performed better than the other algorithms, with an AUC of 0.821, showing excellent predictive ability for DM in patients with PSC. In addition, calibration and DCA curves indicated that the model was highly consistent with actual observations and showed better clinical applicability (<xref ref-type="bibr" rid="B30">30</xref>).</p>
<p>Carcinoembryonic antigen levels, cytokeratin 19 fragment (CYFRA21-1), and other serologic indicators, which have been associated with DM in patients with NSCLC (<xref ref-type="bibr" rid="B31">31</xref>, <xref ref-type="bibr" rid="B32">32</xref>), were not included in this study due to missing data in the SEER program. However, the relatively high accuracy of the XGB algorithm still helped identify those PSC patients with a high risk for DM. To facilitate the use of the ML predictor, a web-based calculator was developed, which is likely to help clinicians detect DM early in patients with PSC in a convenient manner.</p>
<p>Compared to other subtypes of NSCLC, PSC is less sensitive to chemoradiotherapy. However, studies have confirmed that chemoradiotherapy significantly prolonged the CSS of PSC patients with DM. Xiao et&#xa0;al. analyzed the prognostic risk factors of 512 patients with metastatic PSC diagnosed between 1975 and 2016 in the SEER program (<xref ref-type="bibr" rid="B13">13</xref>). They found that having received chemotherapy (HR 0.308, P &lt; 0.001) was an independent prognostic factor for PSC patients with DM, which was similar to our study findings (HR 0.29, P &lt; 0.001). However, they did not identify radiation therapy and surgical resection as independent prognostic factors for PSC patients with DM, while these two therapies were indicated to prolong CSS significantly in our study. We speculate that this discrepancy arose because some of the patients enrolled in that study were diagnosed prior to the year 2000, when surgical and radiation techniques were less effective. Our study identified T-stage and N-stage as important prognostic risk factors for PSC patients with DM. Advanced T stage (T4, HR 2.52, P = 0.005; T3, HR 2.10, P = 0.03) and N-stage (N3, HR 1.88, P = 0.002; N2, HR 1.60, P = 0.005) correlated with poor CSS in PSC patients with DM.</p>
<p>Interestingly, we also found that the nodule site appeared to affect the prognosis for PSC patients with DM. CSS was longer in patients whose primary site was located on an upper rather than a lower lobe (HR, 0.68; P = 0.011). The reason may be that nodules in the lower lung develop more DM lesions, leading to a worse prognosis (<xref ref-type="bibr" rid="B13">13</xref>). Notably, we established a nomogram for predicting the prognosis for PSC patients with DM, with relatively high AUCs at 3 and 6 months. Its high consistency with actual observations indicates that this nomogram could precisely predict CSS in PSC patients with DM.</p>
<p>There are some limitations in our present study. First, this was a retrospective study, and selection bias could not be avoided. Second, characteristic information about DM was collected during initial hospitalization, which may have led to an underestimated percentage of DM in patients with PSC. Lastly, the predictive model was externally validated using patients&#x2019; information from Southwest Hospital in China. However, since this hospital mainly treats Chinese patients, the model&#x2019;s application value should be further validated in cohorts involving differing ethnicities.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusion</title>
<p>Our study indicated that advanced T-stage, advanced N-stage, and histology of giant cell carcinoma or spindle cell carcinoma were risk factors for DM in PSC patients, and patients with these features should receive more attention in terms of preventative therapeutic strategies. The AUC, accuracy, sensitivity, and specificity of the XGB model reached 0.821, 0.755, 0.757, and 0.754, respectively. A diagnostic model for DM based on the ML algorithm and a web-based predictor were then established, which could conveniently and precisely predict the risk of DM in PSC patients. Our study provided initial predictive and prognostic models for PSC patients with DM. Future studies may focus on further improving the models by adding other potential variables and developing more detailed models to predict the risk and prognosis for specific metastatic sites.</p>
</sec>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>.</p>
</sec>
<sec id="s7" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving human participants were reviewed and approved by Southwest Hospital, Third Military Medical University. Written informed consent for participation was not required for this study in accordance with the national legislation and the institutional requirements.</p>
</sec>
<sec id="s8" sec-type="author-contributions">
<title>Author contributions</title>
<p>XY and WX designed the study. GT, LZ, and KW collected the primary data. XY drafted the manuscript. HL and XZ reviewed and edited the paper. All authors contributed to the article and approved the submitted version.</p>
</sec>
</body>
<back>
<sec id="s9" sec-type="funding-information">
<title>Funding</title>
<p>This study was supported by Chongqing Medical Scientific Research Project (No. 2020FYYX012 and No. 2020jstg016).</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>We sincerely thank all authors who contributed to establishing effective R packages and the editors who helped to check for and correct grammatical errors in this work.</p>
</ack>
<sec id="s10" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s12" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fonc.2023.1105224/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fonc.2023.1105224/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet_1.csv" id="SM1" mimetype="text/csv"/>
<supplementary-material xlink:href="DataSheet_2.csv" id="SM2" mimetype="text/csv"/>
<supplementary-material xlink:href="Image_1.tif" id="SF1" mimetype="image/tiff">
<label>Supplementary Figure&#xa0;1</label>
<caption>
<p>The Forest plot of the univariate logistic regression analysis. OR, odds ratio.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Image_2.tif" id="SF2" mimetype="image/tiff">
<label>Supplementary Figure&#xa0;2</label>
<caption>
<p>Forest plot of multivariate logistic regression analysis. The OR value decreases from top to bottom.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Image_3.tif" id="SF3" mimetype="image/tiff">
<label>Supplementary Figure&#xa0;3</label>
<caption>
<p>The Forest plot of the univariate Cox proportional hazards regression analysis. HR, hazard ratio.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Image_4.tif" id="SF4" mimetype="image/tiff">
<label>Supplementary Figure&#xa0;4</label>
<caption>
<p>The Forest plot of the multivariate Cox proportional hazards regression analysis. The HR value is in descending order from top to bottom.</p>
</caption>
</supplementary-material>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Travis</surname> <given-names>WD</given-names>
</name>
<name>
<surname>Brambilla</surname> <given-names>E</given-names>
</name>
<name>
<surname>Burke</surname> <given-names>AP</given-names>
</name>
<name>
<surname>Marx</surname> <given-names>A</given-names>
</name>
<name>
<surname>Nicholson</surname> <given-names>AG</given-names>
</name>
</person-group>. <article-title>Introduction to the 2015 world health organization classification of tumors of the lung, pleura, thymus, and heart</article-title>. <source>J Thorac Oncol</source> (<year>2015</year>) <volume>10</volume>(<issue>9</issue>):<page-range>1240&#x2013;2</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/JTO.0000000000000663</pub-id>
</citation>
</ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>L</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>L</given-names>
</name>
<name>
<surname>Gu</surname> <given-names>Q</given-names>
</name>
<etal/>
</person-group>. <article-title>Clinical characteristics and prognostic analysis of 38 patients with pulmonary sarcomatoid carcinoma</article-title>. <source>Chin J Lung Cancer</source> (<year>2015</year>) <volume>18</volume>(<issue>9</issue>):<page-range>537&#x2013;42</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3779/j.issn.1009-3419.2015.09.02</pub-id>
</citation>
</ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ung</surname> <given-names>M</given-names>
</name>
<name>
<surname>Rouquette</surname> <given-names>I</given-names>
</name>
<name>
<surname>Filleron</surname> <given-names>T</given-names>
</name>
<name>
<surname>Taillandy</surname> <given-names>K</given-names>
</name>
<name>
<surname>Brouchet</surname> <given-names>L</given-names>
</name>
<name>
<surname>Bennouna</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Characteristics and clinical outcomes of sarcomatoid carcinoma of the lung</article-title>. <source>Clin Lung Cancer</source> (<year>2016</year>) <volume>17</volume>(<issue>5</issue>):<page-range>391&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cllc.2016.03.001</pub-id>
</citation>
</ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname> <given-names>L</given-names>
</name>
<name>
<surname>Dai</surname> <given-names>J</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Duan</surname> <given-names>L</given-names>
</name>
<name>
<surname>He</surname> <given-names>W</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Q</given-names>
</name>
<etal/>
</person-group>. <article-title>Pulmonary sarcomatoid carcinoma: experience from SEER database and shanghai pulmonary hospital</article-title>. <source>Ann Thorac Surg</source> (<year>2020</year>) <volume>110</volume>(<issue>2</issue>):<page-range>406&#x2013;13</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.athoracsur.2020.02.071</pub-id>
</citation>
</ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vieira</surname> <given-names>T</given-names>
</name>
<name>
<surname>Antoine</surname> <given-names>M</given-names>
</name>
<name>
<surname>Ruppert</surname> <given-names>A-M</given-names>
</name>
<name>
<surname>Fallet</surname> <given-names>V</given-names>
</name>
<name>
<surname>Duruisseaux</surname> <given-names>M</given-names>
</name>
<name>
<surname>Giroux Leprieur</surname> <given-names>E</given-names>
</name>
<etal/>
</person-group>. <article-title>Blood vessel invasion is a major feature and a factor of poor prognosis in sarcomatoid carcinoma of the lung</article-title>. <source>Lung Cancer</source> (<year>2014</year>) <volume>85</volume>:<page-range>276&#x2013;81</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.lungcan.2014.06.004</pub-id>
</citation>
</ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liang</surname> <given-names>L</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>C</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Adjuvant chemotherapy is not a decisive factor in improving the overall survival of pulmonary sarcoma: a population-based study</article-title>. <source>Front Oncol</source> (<year>2022</year>) <volume>12</volume>:<elocation-id>940839</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fonc.2022.940839</pub-id>
</citation>
</ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zheng</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Fu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhong</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Deng</surname> <given-names>R</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
</person-group>. <article-title>The treatment of advanced pulmonary sarcomatoid carcinoma</article-title>. <source>Future Oncol</source> (<year>2022</year>) <volume>18</volume>:<page-range>727&#x2013;38</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.2217/fon-2021-1071</pub-id>
</citation>
</ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gong</surname> <given-names>C</given-names>
</name>
<name>
<surname>Xiong</surname> <given-names>H</given-names>
</name>
<name>
<surname>Qin</surname> <given-names>K</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>MET alterations in advanced pulmonary sarcomatoid carcinoma</article-title>. <source>Front Oncol</source> (<year>2022</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fonc.2022.1017026</pub-id>
</citation>
</ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Park</surname> <given-names>JS</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Han</surname> <given-names>J</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>HK</given-names>
</name>
<name>
<surname>Choi</surname> <given-names>YS</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Clinicopathologic outcomes of curative resection for sarcomatoid carcinoma of the lung</article-title>. <source>Oncology</source> (<year>2011</year>) <volume>81</volume>:<page-range>206&#x2013;13</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1159/000333095</pub-id>
</citation>
</ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Weissferdt</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Pulmonary sarcomatoid carcinomas: a review</article-title>. <source>Adv Anat Pathol</source> (<year>2018</year>) <volume>25</volume>:<page-range>304&#x2013;13</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/PAP.0000000000000202</pub-id>
</citation>
</ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yendamuri</surname> <given-names>S</given-names>
</name>
<name>
<surname>Caty</surname> <given-names>L</given-names>
</name>
<name>
<surname>Pine</surname> <given-names>M</given-names>
</name>
<name>
<surname>Adem</surname> <given-names>S</given-names>
</name>
<name>
<surname>Bogner</surname> <given-names>P</given-names>
</name>
<name>
<surname>Miller</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Outcomes of sarcomatoid carcinoma of the lung: a surveillance, epidemiology, and end results database analysis</article-title>. <source>Surgery</source> (<year>2012</year>) <volume>152</volume>:<fpage>397</fpage>&#x2013;<lpage>402</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.surg.2012.05.007</pub-id>
</citation>
</ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smadhi</surname> <given-names>H</given-names>
</name>
<name>
<surname>Boudaya</surname> <given-names>MS</given-names>
</name>
<name>
<surname>Abdannadher</surname> <given-names>M</given-names>
</name>
<name>
<surname>BenAbdelghaffar</surname> <given-names>H</given-names>
</name>
<name>
<surname>Kamoun</surname> <given-names>H</given-names>
</name>
<name>
<surname>Ayadi</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Pulmonary sarcomatoid carcinoma: a surgical diagnosis and prognostic factors</article-title>. <source>Tunis Med</source> (<year>2019</year>) <volume>97</volume>:<page-range>128&#x2013;32</page-range>.</citation>
</ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiao</surname> <given-names>C</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Hao</surname> <given-names>J</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>C</given-names>
</name>
<name>
<surname>Pu</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Clinicopathological features and prognostic analysis of metastatic pulmonary sarcomatoid carcinoma: a SEER analysis</article-title>. <source>J Thorac Dis</source> (<year>2021</year>) <volume>13</volume>:<fpage>893</fpage>&#x2013;<lpage>905</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.21037/jtd-20-2826</pub-id>
</citation>
</ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Du</surname> <given-names>M</given-names>
</name>
<name>
<surname>Haag</surname> <given-names>DG</given-names>
</name>
<name>
<surname>Lynch</surname> <given-names>JW</given-names>
</name>
<name>
<surname>Mittinty</surname> <given-names>MN</given-names>
</name>
</person-group>. <article-title>Comparison of the tree-based machine learning algorithms to cox regression in predicting the survival of oral and pharyngeal cancers: analyses based on SEER database</article-title>. <source>Cancers (Basel)</source> (<year>2020</year>) <volume>12</volume>:<elocation-id>2802</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/cancers12102802</pub-id>
</citation>
</ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname> <given-names>C</given-names>
</name>
<name>
<surname>Light</surname> <given-names>A</given-names>
</name>
<name>
<surname>Alaa</surname> <given-names>A</given-names>
</name>
<name>
<surname>Thurtle</surname> <given-names>D</given-names>
</name>
<name>
<surname>van der Schaar</surname> <given-names>M</given-names>
</name>
<name>
<surname>Gnanapragasam</surname> <given-names>VJ</given-names>
</name>
</person-group>. <article-title>Application of a novel machine learning framework for predicting non-metastatic prostate cancer-specific mortality in men using the surveillance, epidemiology, and end results (SEER) database</article-title>. <source>Lancet Digit Health</source> (<year>2021</year>) <volume>3</volume>:<page-range>e158&#x2013;65</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S2589-7500(20)30314-9</pub-id>
</citation>
</ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>T</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>S</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Jing</surname> <given-names>H</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>T</given-names>
</name>
<etal/>
</person-group>. <article-title>Predictive models based on machine learning for bone metastasis in patients with diagnosed colorectal cancer</article-title>. <source>Front Public Health</source> (<year>2022</year>) <volume>10</volume>:<elocation-id>984750</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpubh.2022.984750</pub-id>
</citation>
</ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gu</surname> <given-names>L</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Pan</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Clinical analysis of 95 cases of pulmonary sarcomatoid carcinoma</article-title>. <source>Biomed Pharmacother</source> (<year>2015</year>) <volume>76</volume>:<page-range>134&#x2013;40</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.biopha.2015.10.009</pub-id>
</citation>
</ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname> <given-names>S-Y</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>S-J</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X-Y</given-names>
</name>
</person-group>. <article-title>Pulmonary sarcomatoid carcinoma: a clinicopathologic study and prognostic analysis of 51 cases</article-title>. <source>World J Surg Oncol</source> (<year>2013</year>) <volume>11</volume>:<elocation-id>252</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1477-7819-11-252</pub-id>
</citation>
</ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Terra</surname> <given-names>SBSP</given-names>
</name>
<name>
<surname>Aubry</surname> <given-names>MC</given-names>
</name>
<name>
<surname>Yi</surname> <given-names>ES</given-names>
</name>
<name>
<surname>Boland</surname> <given-names>JM</given-names>
</name>
</person-group>. <article-title>Immunohistochemical study of 36 cases of pulmonary sarcomatoid carcinoma&#x2013;sensitivity of TTF-1 is superior to napsin</article-title>. <source>Hum Pathol</source> (<year>2014</year>) <volume>45</volume>:<fpage>294</fpage>&#x2013;<lpage>302</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.humpath.2013.09.005</pub-id>
</citation>
</ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zombori-T&#xf3;th</surname> <given-names>N</given-names>
</name>
<name>
<surname>Kiss</surname> <given-names>S</given-names>
</name>
<name>
<surname>O&#x161;tarija&#x161;</surname> <given-names>E</given-names>
</name>
<name>
<surname>Alizadeh</surname> <given-names>H</given-names>
</name>
<name>
<surname>Zombori</surname> <given-names>T</given-names>
</name>
</person-group>. <article-title>Adjuvant chemotherapy could improve the survival of pulmonary sarcomatoid carcinoma: a systematic review and meta-analysis</article-title>. <source>Surg Oncol</source> (<year>2022</year>) <volume>44</volume>:<elocation-id>101824</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.suronc.2022.101824</pub-id>
</citation>
</ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lococo</surname> <given-names>F</given-names>
</name>
<name>
<surname>Rapicetta</surname> <given-names>C</given-names>
</name>
<name>
<surname>Cardillo</surname> <given-names>G</given-names>
</name>
<name>
<surname>Stefani</surname> <given-names>A</given-names>
</name>
<name>
<surname>Margaritora</surname> <given-names>S</given-names>
</name>
<name>
<surname>Leuzzi</surname> <given-names>G</given-names>
</name>
<etal/>
</person-group>. <article-title>Pathologic findings and long-term results after surgical treatment for pulmonary sarcomatoid tumors: a multicenter analysis</article-title>. <source>Ann Thorac Surg</source> (<year>2017</year>) <volume>103</volume>:<page-range>1142&#x2013;50</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.athoracsur.2016.08.114</pub-id>
</citation>
</ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>B</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Mutation landscape and tumor mutation burden analysis of Chinese patients with pulmonary sarcomatoid carcinomas</article-title>. <source>Int J Clin Oncol</source> (<year>2019</year>) <volume>24</volume>:<page-range>1061&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10147-019-01454-6</pub-id>
</citation>
</ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>X</given-names>
</name>
<name>
<surname>Jia</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Stoopler</surname> <given-names>MB</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>H</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Next-generation sequencing of pulmonary sarcomatoid carcinoma reveals high frequency of actionable MET gene mutations</article-title>. <source>J Clin Oncol</source> (<year>2016</year>) <volume>34</volume>:<fpage>794</fpage>&#x2013;<lpage>802</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1200/JCO.2015.62.0674</pub-id>
</citation>
</ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Awad</surname> <given-names>MM</given-names>
</name>
<name>
<surname>Oxnard</surname> <given-names>GR</given-names>
</name>
<name>
<surname>Jackman</surname> <given-names>DM</given-names>
</name>
<name>
<surname>Savukoski</surname> <given-names>DO</given-names>
</name>
<name>
<surname>Hall</surname> <given-names>D</given-names>
</name>
<name>
<surname>Shivdasani</surname> <given-names>P</given-names>
</name>
<etal/>
</person-group>. <article-title>MET exon 14 mutations in non-small-cell lung cancer are associated with advanced age and stage-dependent MET genomic amplification and c-Met overexpression</article-title>. <source>J Clin Oncol</source> (<year>2016</year>) <volume>34</volume>:<page-range>721&#x2013;30</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1200/JCO.2015.63.4600</pub-id>
</citation>
</ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>L</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>D</given-names>
</name>
<name>
<surname>Qiu</surname> <given-names>T</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W</given-names>
</name>
<etal/>
</person-group>. <article-title>Identification of MET exon14 skipping by targeted DNA- and RNA-based next-generation sequencing in pulmonary sarcomatoid carcinomas</article-title>. <source>Lung Cancer</source> (<year>2018</year>) <volume>122</volume>:<page-range>113&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.lungcan.2018.06.001</pub-id>
</citation>
</ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Drusbosky</surname> <given-names>LM</given-names>
</name>
<name>
<surname>Dawar</surname> <given-names>R</given-names>
</name>
<name>
<surname>Rodriguez</surname> <given-names>E</given-names>
</name>
<name>
<surname>Ikpeazu</surname> <given-names>CV</given-names>
</name>
</person-group>. <article-title>Therapeutic strategies in METex14 skipping mutated non-small cell lung cancer</article-title>. <source>J Hematol Oncol</source> (<year>2021</year>) <volume>14</volume>:<elocation-id>129</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13045-021-01138-7</pub-id>
</citation>
</ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Fang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>L</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>J</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>Q</given-names>
</name>
<etal/>
</person-group>. <article-title>Once-daily savolitinib in Chinese patients with pulmonary sarcomatoid carcinomas and other non-small-cell lung cancers harbouring MET exon 14 skipping alterations: a multicentre, single-arm, open-label, phase 2 study</article-title>. <source>Lancet Respir Med</source> (<year>2021</year>) <volume>9</volume>:<page-range>1154&#x2013;64</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S2213-2600(21)00084-9</pub-id>
</citation>
</ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cai</surname> <given-names>H</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>J</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>The prognostic analysis of different metastatic patterns in extensive-stage small-cell lung cancer patients: a large population-based study</article-title>. <source>Future Oncol</source> (<year>2018</year>) <volume>14</volume>:<page-range>1397&#x2013;407</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.2217/fon-2017-0706</pub-id>
</citation>
</ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gao</surname> <given-names>H</given-names>
</name>
<name>
<surname>He</surname> <given-names>Z-Y</given-names>
</name>
<name>
<surname>Du</surname> <given-names>X-L</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z-G</given-names>
</name>
<name>
<surname>Xiang</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Machine learning for the prediction of synchronous organ-specific metastasis in patients with lung cancer</article-title>. <source>Front Oncol</source> (<year>2022</year>) <volume>12</volume>:<elocation-id>817372</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fonc.2022.817372</pub-id>
</citation>
</ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>M</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>B</given-names>
</name>
<name>
<surname>Li</surname> <given-names>F</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Survival analysis and prediction model for pulmonary sarcomatoid carcinoma based on SEER database</article-title>. <source>Front Oncol</source> (<year>2021</year>) <volume>11</volume>:<elocation-id>630885</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fonc.2021.630885</pub-id>
</citation>
</ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cacho-D&#xed;az</surname> <given-names>B</given-names>
</name>
<name>
<surname>Cuapat&#xe9;ncatl</surname> <given-names>LD</given-names>
</name>
<name>
<surname>Rodr&#xed;guez</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Garcilazo-Reyes</surname> <given-names>YJ</given-names>
</name>
<name>
<surname>Reynoso-Nover&#xf3;n</surname> <given-names>N</given-names>
</name>
<name>
<surname>Arrieta</surname> <given-names>O</given-names>
</name>
</person-group>. <article-title>Identification of a high-risk group for brain metastases in non-small cell lung cancer patients</article-title>. <source>J Neurooncol</source> (<year>2021</year>) <volume>155</volume>:<page-range>101&#x2013;6</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11060-021-03849-w</pub-id>
</citation>
</ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Park</surname> <given-names>S</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>SM</given-names>
</name>
<name>
<surname>Ahn</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>M</given-names>
</name>
<name>
<surname>Suh</surname> <given-names>CH</given-names>
</name>
<name>
<surname>Do</surname> <given-names>K-H</given-names>
</name>
<etal/>
</person-group>. <article-title>Identification of predictors for brain metastasis in newly diagnosed non-small cell lung cancer: a single-center cohort study</article-title>. <source>Eur Radiol</source> (<year>2022</year>) <volume>32</volume>:<fpage>990</fpage>&#x2013;<lpage>1001</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00330-021-08215-y</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>