<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Cell Dev. Biol.</journal-id>
<journal-title>Frontiers in Cell and Developmental Biology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Cell Dev. Biol.</abbrev-journal-title>
<issn pub-type="epub">2296-634X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">769711</article-id>
<article-id pub-id-type="doi">10.3389/fcell.2022.769711</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Cell and Developmental Biology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Integrated Analysis of MATH-Based Subtypes Reveals a Novel Screening Strategy for Early-Stage Lung Adenocarcinoma</article-title>
<alt-title alt-title-type="left-running-head">Li et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">A Novel Strategy for LUAD</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Chang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/870682/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tian</surname>
<given-names>Chen</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zeng</surname>
<given-names>Yulan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liang</surname>
<given-names>Jinyan</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yang</surname>
<given-names>Qifan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gu</surname>
<given-names>Feifei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Hu</surname>
<given-names>Yue</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/931471/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Liu</surname>
<given-names>Li</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/842101/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Cancer Center</institution>, <institution>Union Hospital</institution>, <institution>Tongji Medical College</institution>, <institution>Huazhong University of Science and Technology</institution>, <addr-line>Wuhan</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Ultrasound</institution>, <institution>Union Hospital</institution>, <institution>Tongji Medical College</institution>, <institution>Huazhong University of Science and Technology</institution>, <addr-line>Wuhan</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/360059/overview">Zexian Liu</ext-link>, Sun Yat-sen University Cancer Center (SYSUCC), China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/847026/overview">Wei-hsuan Yu</ext-link>, National Taiwan University, Taiwan</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/433963/overview">Keyue Ma</ext-link>, University of Texas at Austin, United&#x20;States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Yue Hu, <email>huyue_cmu@126.com</email>; Li Liu, <email>liulist2013@163.com</email>
</corresp>
<fn fn-type="equal" id="fn1">
<label>
<sup>&#x2020;</sup>
</label>
<p>These authors have contributed equally to this&#x20;work</p>
</fn>
<fn fn-type="other">
<p>This article was submitted to Molecular and Cellular Oncology, a section of the journal Frontiers in Cell and Developmental Biology</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>08</day>
<month>02</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>10</volume>
<elocation-id>769711</elocation-id>
<history>
<date date-type="received">
<day>02</day>
<month>09</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>19</day>
<month>01</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Li, Tian, Zeng, Liang, Yang, Gu, Hu and Liu.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Li, Tian, Zeng, Liang, Yang, Gu, Hu and Liu</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<abstract>
<p>Lung adenocarcinoma (LUAD) is a frequently diagnosed cancer type, and many patients have already reached an advanced stage when diagnosed. Thus, it is crucial to develop a novel and efficient approach to diagnose and classify lung adenocarcinoma at an early stage. In our study, we combined <italic>in silico</italic> analysis and machine learning to develop a new five-gene&#x2013;based diagnosis strategy, which was further verified in independent cohorts and <italic>in&#x20;vitro</italic> experiments. Considering the heterogeneity in cancer, we used the MATH (mutant-allele tumor heterogeneity) algorithm to divide patients with early-stage LUAD into two groups (C1 and C2). Specifically, patients in C2 had lower intratumor heterogeneity and higher abundance of immune cells (including B&#x20;cell, CD4 T&#x20;cell, CD8 T&#x20;cell, macrophage, dendritic cell, and neutrophil). In addition, patients in C2 had a higher likelihood of immunotherapy response and overall survival advantage than patients in C1. Combined drug sensitivity analysis (CTRP/PRISM/CMap/GDSC) revealed that BI-2536 might serve as a new therapeutic compound for patients in C1. In order to realize the application value of our study, we constructed the classifier (to classify early-stage LUAD patients into C1 or C2 groups) with multiple machine learning and bioinformatic analyses. The 21-gene&#x2013;based classification model showed high accuracy and strong generalization ability, and it was verified in four independent validation cohorts. In summary, our research provided a new strategy for clinicians to make a quick preliminary assisting diagnosis of early-stage LUAD and make patient classification at the intratumor heterogeneity level. All data, codes, and study processes have been deposited to Github and are available online.</p>
</abstract>
<kwd-group>
<kwd>lung adenocarcinoma</kwd>
<kwd>diagnosis</kwd>
<kwd>mutant allele tumor heterogeneity</kwd>
<kwd>machine learning</kwd>
<kwd>classification</kwd>
<kwd>immunotherapy</kwd>
<kwd>drug sensitivity</kwd>
</kwd-group>
<contract-num rid="cn001">2016YFC1303800</contract-num>
<contract-num rid="cn002">81773056 82073179</contract-num>
<contract-sponsor id="cn001">National Key Research and Development Program of China<named-content content-type="fundref-id">10.13039/501100012166</named-content>
</contract-sponsor>
<contract-sponsor id="cn002">National Natural Science Foundation of China<named-content content-type="fundref-id">10.13039/501100001809</named-content>
</contract-sponsor>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>Non&#x2013;small cell lung cancer (NSCLC) is the most common variety of lung cancer, which is the leading cause of cancer-related death worldwide (<xref ref-type="bibr" rid="B5">Bray et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B9">Duma et&#x20;al., 2019</xref>). Lung adenocarcinoma (LUAD) is the major histological type of NSCLC. According to previous studies, lung adenocarcinoma is often heterogenous. Despite that great advance in the treatment of LUAD has been made in the past few decades, the 5-years survival is still not satisfactory (<xref ref-type="bibr" rid="B3">Baba et&#x20;al., 2012</xref>; <xref ref-type="bibr" rid="B39">Zappa and Mousa, 2016</xref>; <xref ref-type="bibr" rid="B31">Shroff et&#x20;al., 2018</xref>). Due to the mild early symptoms, most patients have already reached an advanced stage when diagnosed, and it results in poor long-term overall survival. Thus, it is urgent to develop efficient biomarkers or signatures that could be used in the diagnosis of LUAD. Meanwhile, understanding the heterogeneity in early-stage lung adenocarcinoma is critical to select and develop more effective treatment.</p>
<p>Intratumor heterogeneity refers to the subclones of diverse genetic background within a tumor, and it is increasingly identified as a key factor in the treatment failure of human cancers. With the rise of next-generation sequencing and machine learning applications in oncology (<xref ref-type="bibr" rid="B6">Cho et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B18">Li et&#x20;al., 2021</xref>; <xref ref-type="bibr" rid="B35">Wang et&#x20;al., 2021</xref>), computational approaches (such as ABSOLUTE) were developed to quantify intratumor heterogeneity based on biological information (<xref ref-type="bibr" rid="B33">Thorsson et&#x20;al., 2018</xref>). MATH (mutant-allele tumor heterogeneity) is a quantitative approach to depict ITH based on variant allele frequency information. In brief, mutant-allele fractions among genomic locus-bearing somatic mutations will be widely distributed in the tumors with distinct subclones, and MATH is a quantitative assessment to normalize the width of such distribution (<xref ref-type="bibr" rid="B28">Rocco, 2015</xref>; <xref ref-type="bibr" rid="B26">Ran et&#x20;al., 2020</xref>). In this study, we used MATH to quantify ITH of early-stage LUAD patients and intended to find MATH-based subtypes. We have explored not only the characteristics of these novel subtypes of LUAD but also the potential treatment for LUAD patients at an early&#x20;stage.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>Materials and Methods</title>
<sec id="s2-1">
<title>Data Pre-processing</title>
<p>RNA sequencing of combined TCGA and GTEx data (free of computational batch effects) and TCGA-LUAD (lung adenocarcinoma) data were downloaded from UCSC Xena (<ext-link ext-link-type="uri" xlink:href="https://xenabrowser.net/datapages/">https://xenabrowser.net/datapages/</ext-link>). Relevant clinical information was also collected from the UCSC Xena browser. The expression data derived from TCGA database were pre-processed by the following steps: 1) removing samples without clinical information; 2) preserving early-stage (stage I and stage II) samples; and 3) expression data were TPM-normalized and genes with log2 (TPM&#x2b;1) &#x3e;0 were preserved. Additionally, copy number alteration and somatic mutation MAF data were downloaded from TCGA data portal (<ext-link ext-link-type="uri" xlink:href="https://portal.gdc.cancer.gov/">https://portal.gdc.cancer.gov/</ext-link>).</p>
<p>The independent validation cohorts (including GSE30219, GSE31210, GSE50081, and GSE72094) were downloaded from GEO (Gene Expression Omnibus, <ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/">http://www.ncbi.nlm.nih.gov/geo/</ext-link>). Detailed information of the study cohorts is shown in the <italic>Supplementary Material</italic>.</p>
</sec>
<sec id="s2-2">
<title>Construction of the Diagnosis Model</title>
<p>Differential gene expression analysis between non-cancerous lung tissues and lung adenocarcinoma tissues was conducted in TCGA-GTEx, GSE30219, and GSE31210 cohorts. DEGs were identified by having log2fc &#x3e; 1 and fdr &#x3c;0.05. Robust rank aggregation (RRA) was used to identify overlapping DEGs (<xref ref-type="bibr" rid="B10">Gan et&#x20;al., 2020</xref>), which were used to develop the diagnosis model. The patients in TCGA-GTEx cohorts were randomly assigned to the training and validation group at a ratio of 7:3. The other datasets (GSE30219 and GSE31210) were used as two independent validation cohorts. Machine learning including elastic net regression (ElasticNet, binomial, alpha &#x3d; 0.9), Random Forest and Bortua (RFB, default), Support Vector Machine-Recursive Feature Elimination (SVM-RFE, svmRFE function in R, k &#x3d; 5, halve. above &#x3d; 100), and eXtreme Gradient Boosting (XGBoost, xgboost function in R, default) was performed to identify the most important predictors. The expression of the overlapping DEGs was used as the input variable, and the status of the tissues (tumor or non-cancerous lung tissue, 1 or 0) was set as the response variable. In the training group, the intersect genes identified by ElasticNet, RFB, SVM-RFE, and XGBoost were collected, and logistic regression analysis was performed on these genes to develop the diagnosis model. The performance of the diagnosis model (in the training and validation group, as well as two independent validation cohorts) was evaluated by receiver operating characteristic (ROC) curves and AUC values.</p>
</sec>
<sec id="s2-3">
<title>Real-Time Quantitative Polymerase Chain Reaction</title>
<p>Total RNA was extracted with TRIzol reagent (Takara), and the synthesis of cDNA was conducted with the qPCR RT Master Mix (Toyobo). To detect the expression of target genes, PCR was performed with the SYBR Green Real-Time PCR kit (Takara) on the StepOnePlus&#x2122; Real-Time PCR System (ABI) based on the manufacturer&#x2019;s instructions. GAPDH was selected as the internal control, and the relative expression levels were determined by comparative Ct (target gene Ct minus GAPDH Ct). Sequences of the primers are listed as follows:</p>
<p>B3GNT3-F: CTT&#x200b;GCT&#x200b;GTC&#x200b;CCG&#x200b;CTT&#x200b;CAC.</p>
<p>B3GNT3-R: GAG&#x200b;GCA&#x200b;GGC&#x200b;TTC&#x200b;AGT&#x200b;CCC.</p>
<p>GALNT7-F: GAA&#x200b;TCG&#x200b;CAG&#x200b;GCA&#x200b;TTA&#x200b;CCA.</p>
<p>GALNT7-R: AAG&#x200b;CCT&#x200b;CTG&#x200b;ATT&#x200b;TCT&#x200b;CCC.</p>
<p>PLEK2-F: CAC&#x200b;GGT&#x200b;GGT&#x200b;GAA&#x200b;ACA&#x200b;AGG.</p>
<p>PLEK2-R: CAG&#x200b;TGG&#x200b;GAA&#x200b;CGC&#x200b;CAT&#x200b;TAT.</p>
<p>GAPDH-F: GAG&#x200b;TCA&#x200b;ACG&#x200b;GAT&#x200b;TTG&#x200b;GTC&#x200b;GT.</p>
<p>GAPDH-R: GAC&#x200b;AAG&#x200b;CTT&#x200b;CCC&#x200b;GTT&#x200b;CTC&#x200b;AG.</p>
</sec>
<sec id="s2-4">
<title>CCK-8 Assay</title>
<p>The cells were seeded in 96-well plates at 2000 cells per well (A549) or 1800 cells per well (H1299) with complete medium. After 1, 2, 3, and 4&#x20;days of culture, the CCK-8 kit (Dojindo) was used to detect cell proliferation, and the absorbance was read at 450&#xa0;nm.</p>
</sec>
<sec id="s2-5">
<title>Calculation of the MATH Value and Gene Expression&#x2013;Based Stemness Index</title>
<p>Mutant-allele tumor heterogeneity (MATH) is a quantitative strategy to quantify the dispersion of allele frequencies of somatic mutations based on whole-exome sequencing data (<xref ref-type="bibr" rid="B28">Rocco, 2015</xref>; <xref ref-type="bibr" rid="B21">McDonald et&#x20;al., 2019</xref>). MATH score was calculated by &#x201c;inferHeterogenetiy&#x201d; function (&#x201c;maftools&#x201d; package in R). In this study, MATH score was used to measure intratumor heterogeneity (ITH), and we compared the MATH score with the ABSOLUTE score (obtained from Thorsson V et&#x20;al. study) to ensure it could reflect the ITH accurately.</p>
<p>To calculate the mRNAsi, Malta et&#x20;al. built a predictive model using one-class logistic regression (OCLR) on the Progenitor Cell Biology Consortium cohort to calculate stemness signatures, which contains the gene expression profile of 11,774 genes (<xref ref-type="bibr" rid="B19">Lian et&#x20;al., 2019</xref>). We applied the stemness signature to calculate the mRNAsi index for patients in our study using Spearman&#x2019;s correlation analysis.</p>
</sec>
<sec id="s2-6">
<title>Identification of the MATH-Based Molecular Subtypes of Lung Adenocarcinoma at an Early Stage</title>
<p>To classify patients into the MATH-based subtypes, survival analysis was performed, and X-tile was used to determine the optimal cutoff of the MATH score (<xref ref-type="bibr" rid="B15">Li et&#x20;al., 2016</xref>). Afterward, the high-MATH group and low-MATH group were generated, and differential gene expression analysis was performed to find DEGs differentially between the two groups. Unsupervised consensus clustering (kmeans, &#x201c;ConsensusClusterPlus&#x201d; package in R) (<xref ref-type="bibr" rid="B35">Wang et&#x20;al., 2021</xref>) based on these DEGs was conducted to explore a novel classification of lung adenocarcinoma: the MATH-based subtypes. This procedure was repeated 1,000&#x20;times and sampled 80% in each iteration to ensure classification stability.</p>
</sec>
<sec id="s2-7">
<title>Calculation of CNA Burden, TMB, and Immunological Characteristics</title>
<p>CNA (copy number alteration) data of TCGA cohort was obtained from TCGA data portal. Amplified or deleted genomes in the whole genome were identified by GISTIC 2.0. The burden of copy number loss or gain was defined as the total number of genes with copy number changes in each sample at the arm and focal levels (<xref ref-type="bibr" rid="B30">Shen R et&#x20;al., 2019</xref>).</p>
<p>TMB was defined as the number of non-synonymous alterations per MB of the genome. Non-synonymous mutations were defined as &#x201c;Frame_Shift_Del&#x201d;, &#x201c;Frame_Shift_Ins&#x201d;, &#x201c;Missense_Mutation&#x201d;, &#x201c;Nonsense_Mutation&#x201d;, &#x201c;Splice_Site&#x201d;, &#x201c;In_Frame_Del&#x201d;, &#x201c;In_Frame_Ins&#x201d;, &#x201c;Translation_Start_Site&#x201d;, and &#x201c;Nonstop_Mutation&#x201d;. The exome size was defined as 38&#xa0;Mb as described in the previous study. TMB was calculated by this formula: TMB &#x3d; non-synonymous mutations/exome size (38&#xa0;Mb) (<xref ref-type="bibr" rid="B34">Wang et&#x20;al., 2019</xref>).</p>
<p>The abundance of six immune cells (including B&#x20;cell, macrophage, dendritic cell, neutrophil, T&#x20;cell CD4, and T&#x20;cell CD8) was calculated by TIMER (<xref ref-type="bibr" rid="B17">Li et&#x20;al., 2020</xref>). The abundance of intratumoral immune and stromal cells was predicted using the ESTIMATE algorithm (&#x201c;ESTIMATE&#x201d; package in R) (<xref ref-type="bibr" rid="B38">Yoshihara et&#x20;al., 2013</xref>). In addition, the enrichment level of 29 immune signatures (<xref ref-type="bibr" rid="B37">Yang et&#x20;al., 2018</xref>), which represent the immune activity of tumors, and three signatures (<xref ref-type="bibr" rid="B23">Messina et&#x20;al., 2012</xref>; <xref ref-type="bibr" rid="B2">Ayers et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B13">Jiang et&#x20;al., 2018</xref>), which represent the immunotherapy response, was quantified by ssGSEA (single-sample gene set enrichment analysis).</p>
</sec>
<sec id="s2-8">
<title>Prediction of TIDE Score and Immunotherapy Response</title>
<p>TIDE (tumor immune dysfunction and exclusion, <ext-link ext-link-type="uri" xlink:href="http://tide.dfci.harvard.edu/">http://tide.dfci.harvard.edu/</ext-link>) score, which was developed based on the mechanism of tumor immune escape, inducing T&#x20;cell dysfunction in tumors with high infiltration of cytotoxic T lymphocytes (CTL) and inhibiting T&#x20;cell infiltration in tumors with low CTL level, was used to predict the clinical response to immunotherapy of patients involved in our study (<xref ref-type="bibr" rid="B13">Jiang et&#x20;al., 2018</xref>). The gene expression value had been normalized before calculation. Then, subclass mapping was processed to realize the prediction of clinical response to anti-PD1 or anti-CTLA4 therapy (<xref ref-type="bibr" rid="B12">Hubble et&#x20;al., 2009</xref>) (&#x201c;SubMap&#x201d; modules in GenePattern, <ext-link ext-link-type="uri" xlink:href="https://cloud.genepattern.org/gp/pages/index.jsf">https://cloud.genepattern.org/gp/pages/index.jsf</ext-link>. A published dataset with melanoma that responded to immunotherapy was set as the reference; custom settings were set as default).</p>
</sec>
<sec id="s2-9">
<title>Construction and Validation of the MATH-Based Subtype Classifier</title>
<p>The TCGA-LUAD patients at an early stage were randomly assigned to the training and validation group at a ratio of 7:3. GSE30219, GSE31210, GSE50081, and GSE72094 were used as external independent validation cohorts. Machine learning algorithms, including ElasticNet, RFB, SVM-RFE, and XGBoost, were performed to identify the most important predictors. The expression of the DEGs was used as the input variable, and the subtype of the sample (subtype I or subtype II, 0 or 1) was set as the response variable. In the training group, the intersect genes identified by ElasticNet, RFB, SVM-RFE, and XGBoost were collected, and logistic regression analysis was performed on these genes to develop the classification model. The model was tested in the validation group. In order to test our classifier generalization ability in the external independent validation cohorts (GSE30219, GSE31210, GSE50081, and GSE72094), we performed the following analysis: 1) performing the same k-means clustering in each cohort based on the same DEGs; 2) comparing the expression profile of the subtypes we defined in TCGA cohort with k-means clustering results in each validation cohort (by using &#x201c;SubMap&#x201d; module in GenePattern); and 3) determining the clustering subtypes in the validation cohorts. The performance of the classifier was investigated by AUC values.</p>
</sec>
<sec id="s2-10">
<title>Drug Sensitivity Analysis</title>
<p>Three approaches were used to conduct drug sensitivity analysis. First, we used the CTRP (Cancer Therapeutics Response Portal) and PRISM (Profiling Relative Inhibition Simultaneously in Mixtures) to generate drug sensitivity data (<xref ref-type="bibr" rid="B27">Rees et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B7">Corsello et&#x20;al., 2020</xref>). Both databases used AUC values as a measure of drug/compound sensitivity. Compounds with missing AUC values &#x3e; 20% of the samples and cell lines were excluded. The &#x201c;pRRophetic&#x201d; package was used to predict the candidate potential drugs in each MATH-based subtype. Then, we predicted the candidate potential drug response for each sample based on the GDSC (the Genomics of Drug Sensitivity in Cancer) database (<xref ref-type="bibr" rid="B36">Yang et&#x20;al., 2013</xref>). IC<sub>50</sub> (the samples&#x2019; half-maximal inhibitory concentration) was estimated based on the GDSC dataset. In addition, we used the CMap (Connectivity Map) database to explore the drugs targeting the genes associated with the MATH-based subtypes (<xref ref-type="bibr" rid="B25">Musa et&#x20;al., 2018</xref>). We queried the CMap database and selected the compound with a negative enrichment score and <italic>p</italic>&#x20;&#x3c; 0.05. The compound overlapping in the results of CTRP/PRISM, GDSC, and CMap analyses was considered important and may serve as a potential treatment for the certain subtype.</p>
</sec>
<sec id="s2-11">
<title>Statistical Analysis</title>
<p>The &#x3c7;<sup>2</sup> test was utilized to evaluate the association between subtypes and mutations. The Shapiro&#x2013;Wilk normality test was used to test the normality of data. Correlations were analyzed using Spearman&#x2019;s correlation. Statistical analyses were conducted using Kruskal&#x2013;Wallis, Wilcoxon, or Student&#x2019;s t&#x20;test. Differences were thought to be significant at <italic>p</italic>&#x20;&#x3c; 0.05. All analyses were performed in R (Version: 3.5.3). All data, codes, and workflow have been deposited to Github.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Result</title>
<sec id="s3-1">
<title>Establishment of the Early-Stage LUAD Diagnostic Model</title>
<p>The general workflow of this study is shown in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>. Differential analysis between early-stage lung adenocarcinoma tissues and non-cancerous lung tissues was performed with Limma package, and a total of 173 DEGs (differentially expressed genes) were screened <italic>via</italic> robust rank aggregation (<xref ref-type="fig" rid="F2">Figure&#x20;2A</xref>). In order to investigate the diagnostic method for early-stage LUAD, the TCGA-GTEx cohort was divided into training and validation cohorts, and two cohorts (GSE30219 and GSE31210) were used as the external validation sets (<xref ref-type="table" rid="T1">Table&#x20;1</xref>, <xref ref-type="sec" rid="s10">Supplementary Table S1</xref>). As described in <italic>Materials and Methods</italic>, four machine learning algorithms (including ElasticNet, RFB, SVM-RFE, and XGBoost) were applied in TCGA-GTEx training set (<xref ref-type="sec" rid="s10">Supplementary Figure S1A-F</xref>). Among the 173 DEGs, five genes (<xref ref-type="sec" rid="s10">Supplementary Table S2</xref>, including B3GNT3, PLEK2, GALNT7, GRK5, and SLC39A8) were found overlapping in different ML methods (<xref ref-type="fig" rid="F2">Figure&#x20;2B</xref>, <xref ref-type="sec" rid="s10">Supplementary Table S3</xref>). The combination of the five genes was analyzed using logistic regression to generate the diagnosis model for early-stage LUAD. The confusion matrix for TCGA-GTEx validation set and two external validation sets (GSE30219 and GSE31210) were shown in <xref ref-type="fig" rid="F2">Figure&#x20;2C</xref> and <xref ref-type="sec" rid="s10">Supplementary Figure S1G</xref>, with AUCs of 0.982, 0.817, and 0.850, respectively.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Flowchart of this study.</p>
</caption>
<graphic xlink:href="fcell-10-769711-g001.tif"/>
</fig>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Construction of the early-stage LUAD diagnosis model. <bold>(A)</bold> Heat map showed differentially expressed genes in tumor tissues (abs logFC&#x3e;1, fdr&#x3c;0.05) identified by RRA. Rows represent DEGs and columns represent different datasets. <bold>(B)</bold> Venn diagram identified five diagnosis genes shared by ElasticNet, SVM-RFE, RFB, and XGBoost machine learning. <bold>(C)</bold>. Confusion matrix of binary result of the diagnosis model for the internal validation cohort.</p>
</caption>
<graphic xlink:href="fcell-10-769711-g002.tif"/>
</fig>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Clinical information of early-stage LUAD patients in TCGA cohort.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Characteristics</th>
<th align="left"/>
<th align="center">No of.cases (N&#x20;&#x3d;&#x20;389)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Gender</td>
<td align="left">Female</td>
<td align="center">213</td>
</tr>
<tr>
<td align="left"/>
<td align="left">Male</td>
<td align="center">176</td>
</tr>
<tr>
<td align="left">Primary therapy outcome</td>
<td align="left">Complete remission/response</td>
<td align="center">236</td>
</tr>
<tr>
<td align="left"/>
<td align="left">Partial remission/response</td>
<td align="center">2</td>
</tr>
<tr>
<td align="left"/>
<td align="left">Stable disease</td>
<td align="center">19</td>
</tr>
<tr>
<td align="left"/>
<td align="left">Progressive disease</td>
<td align="center">36</td>
</tr>
<tr>
<td align="left"/>
<td align="left">Unknown</td>
<td align="center">96</td>
</tr>
<tr>
<td align="left">Neoadjuvant treatment</td>
<td align="left">No</td>
<td align="center">388</td>
</tr>
<tr>
<td align="left"/>
<td align="left">Yes</td>
<td align="center">1</td>
</tr>
<tr>
<td align="left">Stage</td>
<td align="left">Stage I</td>
<td align="center">271</td>
</tr>
<tr>
<td align="left"/>
<td align="left">Stage II</td>
<td align="center">118</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The diagnostic model showed good prediction ability. Among the five genes involved in the diagnosis formula, the coefficients of three genes (B3GNT3, GALNT7, and PLEK2) were positive, indicating that the higher the expression level of these genes, the higher the likelihood of being diagnosed with cancer. These three genes might play an oncogene role in lung cancer. To prove this, we respectively downregulated the expression of B3GNT3, GALNT7, PLEK2 in A549 and H1299 cells via RNAi treatment (<xref ref-type="sec" rid="s10">Supplementary Figure S2</xref>). As expected, the silencing of these genes inhibited lung cancer cell proliferation and growth (<xref ref-type="fig" rid="F3">Figures 3A&#x2013;D</xref>, B3GNT3, <xref ref-type="fig" rid="F3">Figures 3E&#x2013;H</xref>, GALNT7, <xref ref-type="fig" rid="F3">Figure&#x20;3I</xref>-L, PLEK2).</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Downregulation of B3GNT3, GALNT7, or PLEK2 suppresses tumorigenesis in lung cancer. <bold>(A&#x2013;B)</bold> CCK-8 assay revealed that B3GNT3 silencing impaired cell proliferation in A549 (A) and H1299 (B) (n &#x3d; 5). <bold>(C&#x2013;D)</bold> B3GNT3 depletion significantly weakened colony-forming capacity of A549 (C) and H1299 (D) (n &#x3d; 3). <bold>(E&#x2013;H)</bold> GALNT7. <bold>(I&#x2013;L)</bold> PLEK2. &#x2a;&#x2a;<italic>p</italic>&#x20;&#x3c; 0.01 and &#x2a;&#x2a;&#x2a;<italic>p</italic>&#x20;&#x3c; 0.001.</p>
</caption>
<graphic xlink:href="fcell-10-769711-g003.tif"/>
</fig>
</sec>
<sec id="s3-2">
<title>Association Between MATH and Immune Infiltration Pattern</title>
<p>First, to explore the overall immune activity of the 389&#x20;early-stage LUAD patients in TCGA cohort, the enrichment abundance of 29&#x20;immune-related signatures was quantified using ssGSEA. As shown in the heatmap (<xref ref-type="sec" rid="s10">Supplementary Figure S3A</xref>), the 389 patients were assigned to three different immune subtypes according to hierarchical clustering. The immune cluster 1, containing 134 (34.4%) patients, had the low enrichment level; the immune cluster 2, containing 74 (19%) patients, had the highest enrichment scores; and the immune cluster 3, containing 181 (46.5%) patients, was characterized by the medium enrichment level. Afterward, immune cell infiltration pattern was evaluated by the TIMER platform and ESTIMATE algorithm. The immune cluster 2 had the highest immune scores and stromal scores (<xref ref-type="sec" rid="s10">Supplementary Figure S3E-F</xref>), indicating its high immunity, while immune cluster 1 showed the opposite. Six immune cell abundance (including B&#x20;cell, macrophage, dendritic cell, neutrophil, CD4 T&#x20;cell, and CD8 T&#x20;cell, quantified by the TIMER platform) showed a gradual decrease from immune cluster 2 to immune cluster 3 to immune cluster 1 (<xref ref-type="sec" rid="s10">Supplementary Figure S3B</xref>). Hence, immune clusters 1&#x2013;3 were defined as low-immunity group, high-immunity group, and medium-immunity group, respectively. By using the OCLR algorithm built by <xref ref-type="bibr" rid="B19">Lian et&#x20;al. (2019)</xref>, stemness index (mRNAsi) of 389 LUAD patients was calculated based on gene expression data. However, mRNAsi was not different among the three groups (<xref ref-type="sec" rid="s10">Supplementary Figure S3C</xref>, Kruskal&#x2013;Wallis test, <italic>p</italic>-value &#x3d;&#x20;0.61).</p>
<p>According to the previous study (<xref ref-type="bibr" rid="B28">Rocco, 2015</xref>), the heterogeneity in the tumor led to differences among mutated loci in terms of the fraction of sequence reads that show a mutant allele. The ratio of the width to the center of the distribution of mutant allele fractions, which is defined as MATH (mutant-allele tumor heterogeneity), is a reflection of the dispersion of variant allele frequencies, thus serving as a measure of intratumor heterogeneity. The MC3 file for TCGA-LUAD was analyzed, and MATH score for 389 patients was calculated using &#x201c;inferHeterogenetiy&#x201d; function (&#x201c;maftool&#x201d; package in R, <xref ref-type="fig" rid="F4">Figure&#x20;4A</xref>). Then, we investigated the relationship between MATH score and ABSOLUTE score. A significant positive correlation between MATH and ABSOLUTE was observed (<xref ref-type="fig" rid="F4">Figure&#x20;4C</xref>, <italic>p</italic>&#x20;&#x3c; 0.001), indicating that the MATH score could well reflect the ITH, so the MATH score was used to measure intratumor heterogeneity in our study. Notably, the MATH score seems to be negatively correlated with immune infiltration: immune cluster 2, which was defined as the high-immunity group, had the lowest MATH score as compared to other clusters (<xref ref-type="sec" rid="s10">Supplementary Figure S3D</xref>, Kruskal&#x2013;Wallis test, <italic>p</italic>&#x20;&#x3d; 0.005 and 0.074, respectively); and general negative correlation was observed between the MATH score and the abundance of immune cells (<xref ref-type="fig" rid="F4">Figures 4D,F&#x2013;K</xref>), which supported the notion that tumor-infiltrating immune cells shape the ITH. In addition, a positive correlation between mRNAsi and the MATH score was observed (<xref ref-type="fig" rid="F4">Figure&#x20;4E</xref>, <italic>p</italic>&#x20;&#x3c; 0.001). To explore the potential link between the MATH score and clinical outcome, survival analysis was performed, and the optimal cutoff point of MATH score was determined by X-tile. Kaplan&#x2013;Meier plot indicated that patients classified into the high-MATH group tended to have a worse overall survival outcome (<xref ref-type="fig" rid="F4">Figure&#x20;4B</xref>, Log-rank test, <italic>p</italic>&#x20;&#x3d; 0.04). Briefly, the abovementioned results indicated that the MATH score was negatively correlated with tumor immune infiltration, and high ITH led to worse clinical outcome.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>MATH associated with TIME and clinical outcome in early-stage LUAD patients. <bold>(A)</bold> Calculation of the MATH score in the main cohort and an overview of association between MATH and mRNAsi and immunity. <bold>(B)</bold> Survival analysis indicated significantly better overall survival in the low-MATH group. <bold>(C)</bold> Association between MATH and subclonal genome fraction quantified by ABSOLUTE. <bold>(D)</bold> Association between MATH and immune-score quantified by ESTIMATE. <bold>(E)</bold> Association between MATH and stemness index calculated by OCLR. <bold>(F&#x2013;K)</bold> Association between MATH and tumor-infiltrating immune cells, including B&#x20;cell, CD4 T&#x20;cell, macrophage, CD8 T&#x20;cell, dendritic cell, and neutrophil.</p>
</caption>
<graphic xlink:href="fcell-10-769711-g004.tif"/>
</fig>
</sec>
<sec id="s3-3">
<title>Identification of Two MATH-Based Subtypes With Distinct Characteristics</title>
<p>Since survival difference was observed between the high- and low-MATH groups, we conducted differential gene expression analysis. A total of 104 DEGs were identified (<xref ref-type="sec" rid="s10">Supplementary Figure S4A</xref>), which were defined as MATH-related DEGs. To unveil the MATH subtype, we further performed unsupervised consensus clustering (K-means) for early-stage LUAD patients based on the expression patterns of MATH-related DEGs (<xref ref-type="sec" rid="s10">Supplementary Figure S4B</xref>, <xref ref-type="sec" rid="s10">Supplementary Table S4</xref>). Thus, 389&#x20;early-stage LUAD patients were classified into cluster 1 (159 patients, 40.9%) and cluster 2 (230 patients, 59.1%) (<xref ref-type="fig" rid="F5">Figure&#x20;5A</xref>), where cluster 1 tended to have a higher mRNAsi and MATH score (<xref ref-type="fig" rid="F5">Figure&#x20;5G</xref>, <xref ref-type="sec" rid="s10">Supplementary Figure S4C-D</xref>). Subsequently, immune cell abundance was compared between cluster 1 and cluster 2 (<xref ref-type="fig" rid="F5">Figure&#x20;5B</xref>), and the six immune cells (B&#x20;cell, CD4 T&#x20;cell. CD8 T&#x20;cell, macrophage, dendritic cell, and neutrophil, quantified by TIMER) were more abundant in cluster 2. The expression level of immune checkpoint molecules PD1 and CTLA-4, with its ligands (PDL1/PDL2, and CD80/CD86), was compared between C1 and C2. The results showed higher expression of these molecules in C2 (<xref ref-type="fig" rid="F5">Figure&#x20;5C</xref>). In addition, immune cluster 2 had a higher proportion in C2 than C1, while immune cluster 1 had the opposite (<xref ref-type="fig" rid="F5">Figure&#x20;5H</xref>).</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Identification of two MATH-based clusters with distinct characteristics and survival outcome. <bold>(A)</bold> Heat map showed the result of the unsupervised consensus clustering based on the 104 DEGs, and two clusters were identified. <bold>(B)</bold> Comparison of the abundance of B&#x20;cell, CD4 T&#x20;cell, CD8 T&#x20;cell, macrophage, dendritic cell, and neutrophil between C1 and C2. <bold>(C)</bold> Comparison of the expression level of PD-1/PD-L1/PD-L2/CTLA-4/CD80/CD86 between C1 and C2. <bold>(D&#x2013;F)</bold> Comparison of the enrichment level of three immunotherapy-related signatures between C1 and C2, including CD8. sig, EIGS (expanded immune gene signature), and 12 chemokines sig. <bold>(G)</bold> Patients in C1 had a higher MATH score than patients in C2. <bold>(H)</bold> Distinct proportions of different immune clusters in C1 and C2, indicating the different immunity between the two subtypes. <bold>(I)</bold>. TIDE algorithm predicted the likelihood of response to immunotherapy in C1 and C2.</p>
</caption>
<graphic xlink:href="fcell-10-769711-g005.tif"/>
</fig>
<p>To predict the response to ICI (immune checkpoint inhibitor) therapy for patients in different clusters, the enrichment level of three immunotherapy-related signatures was quantified using ssGSEA. As compared to C1, patients in C2 had a significant higher enrichment of these signatures (CD8. sig, EIGS, 12-chemokines, <xref ref-type="fig" rid="F5">Figures 5D&#x2013;F</xref>), indicating that patients in C2 might have better response to ICI therapy. In addition, the TIDE algorithm was used to predict immunotherapy response. The result showed that the proportion of responders to immunotherapy in C2 was significantly higher than that in C1 (<xref ref-type="fig" rid="F5">Figure&#x20;5I</xref>, chi-square test, <italic>p</italic>&#x20;&#x3c; 0.001). Next, subclass mapping was performed (&#x201c;SubMap&#x201d; module in GenePattern), and a melanoma immunotherapy cohort was set as the reference. It was found that patients in C2 might have better response to anti-PD1 or anti-CTLA4 therapy (<xref ref-type="fig" rid="F6">Figure&#x20;6B</xref>). Afterward, we performed GSEA (gene set enrichment analysis) to identify hallmarks associated with different MATH clusters. GSEA results revealed that &#x201c;Glycolysis&#x201d;, &#x201c;MYC_target&#x201d;, &#x201c;MTORC1 signaling&#x201d;, and &#x201c;PI3K-AKT-MTOR signaling&#x201d; were enriched in C1, while &#x201c;IL2-STAT5 signaling&#x201d;, &#x201c;inflammatory response&#x201d;, &#x201c;IFN-gamma response&#x201d;, &#x201c;P53 pathway&#x201d;, and &#x201c;TNFA signaling&#x201d; were enriched in C2 (<xref ref-type="sec" rid="s10">Supplementary Figure S4E-F</xref>). In brief, the abovementioned results indicated that samples in C2 had higher immune infiltration and immunogenicity, and patients in C2 had higher likelihood of response to immunotherapy than&#x20;C1.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>MATH-based subtype was a prevalent phenomenon in early-stage LUAD. <bold>(A)</bold>. Kaplan&#x2013;Meier survival analysis revealed significantly better overall survival in patients in C2. <bold>(B)</bold> Submap analysis for predicting the likelihood of immunotherapy response for C1 and C2. <bold>(C&#x2013;F)</bold> Different clinical overall survival outcomes between C1 and C2 in GSE30219, GSE50081, GSE31210, and GSE72094.</p>
</caption>
<graphic xlink:href="fcell-10-769711-g006.tif"/>
</fig>
</sec>
<sec id="s3-4">
<title>The MATH-Based Clusters are Prevalent in Early-Stage Lung Adenocarcinoma</title>
<p>We analyzed the survival outcome of the two clusters, and the result revealed that patients in C2 had better overall survival (<xref ref-type="fig" rid="F6">Figure&#x20;6A</xref>, TCGA cohort, log-rank test, <italic>p</italic>&#x20;&#x3d; 0.046). To investigate whether the two clusters were widespread in early-stage lung adenocarcinoma, we performed the same unsupervised consensus clustering (based on MATH-related DEGs) in GSE30219 (N &#x3d; 85), GSE31210 (N &#x3d; 226), GSE50081 (N &#x3d; 127), and GSE72094 (N &#x3d; 334). In all four independent validation sets, the early-stage LUAD patients could be classified into two groups, and patients in C1 tended to have a worse survival outcome (<xref ref-type="fig" rid="F6">Figures 6C&#x2013;F</xref>, log-rank test, <italic>p</italic>-value GSE30219: 0.28; GSE31210: 0.013; GSE50081: 0.034; GSE72094: &#x3c;0.0001), which was consistent with our previous result. The survival difference did not reach statistical significance in the GSE30219 cohort, which might be due to the small sample size. To prove that the clusters generated in the validation cohorts were the same as those in TCGA cohort, we further performed submap analysis. As shown in the figure, the C1/C2 clusters of the validation cohorts could be well-mapped into the C1/C2 clusters of TCGA cohort (<xref ref-type="sec" rid="s10">Supplementary Figure S5</xref>, all <italic>p</italic>-value and FDR &#x3c;0.01). The result revealed that the MATH-based clusters are stable and widespread in early-stage lung adenocarcinoma, and patients in C2 tend to have a better survival outcome.</p>
</sec>
<sec id="s3-5">
<title>Construction and Validation of the Cluster Predictor</title>
<p>Since early-stage LUAD patients could be classified into two distinct clusters, we attempted to build a classifier to predict patient groups. TCGA cohort was divided into training and validation groups at a ratio of 7:3. GSE30219, GSE31210, GSE50081, and GSE72094 were used as external validation cohorts. In the training group, ML algorithms were applied to screen important features based on the expression file of 104&#x20;MATH-related DEGs, and a total of 37, 79, 58, and 63 genes were identified by ElasticNet, SVM-RFE, Xgboost, and RFB, respectively (<xref ref-type="sec" rid="s10">Supplementary Figure S6</xref>, <xref ref-type="sec" rid="s10">Supplementary Table S5</xref>). Twenty-four genes were found overlapping in different ML methods (<xref ref-type="fig" rid="F7">Figure&#x20;7A</xref>). To construct the classifier, we reduced the 24 genes to 21 genes that were common to all datasets. The combination of the 21 genes was analyzed using logistic regression (<xref ref-type="fig" rid="F7">Figure&#x20;7B</xref>), and we built the classifier. The confusion matrix for the training and validation groups and four external validation sets (GSE30219, GSE31210, GSE50081, and GSE72094) are shown in <xref ref-type="fig" rid="F7">Figures 7C&#x2013;H</xref>. In TCGA validation group, the accuracy, precision, recall, F1 score, and AUC for the classifier was 0.94, 0.93, 0.91, 0.92, and 0.94, respectively. In GSE30219, the accuracy, precision, recall, F1 score, and AUC for the classifier was 0.91, 0.84, 0.90, 0.87, and 0.91, respectively. In GSE31210, the accuracy, precision, recall, F1 score, and AUC for the classifier was 0.92, 0.88, 0.87, 0.87, and 0.90, respectively. In GSE50081, the accuracy, precision, recall, F1 score, and AUC for the classifier was 0.86, 0.94, 0.76, 0.84, and 0.86, respectively. In GSE72094, the accuracy, precision, recall, F1 score, and AUC for the classifier was 0.91, 0.96, 0.82, 0.88, and 0.90, respectively. The abovementioned result indicated that the classifier predictor we built had excellent performance and good generalization capability, and it could be instructive for the classification of early-stage LUAD patients.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Construction and validation of the subtype predictor. <bold>(A)</bold> Venn diagram identified 24 genes shared by ElasticNet, SVM-RFE, RFB, and XGBoost machine learning. <bold>(B)</bold> Coefficient of the 21 common genes shared by all studying cohorts. The combination of these 21 genes was used to generate the subtype predictor using logistic regression. <bold>(C&#x2013;H)</bold> Confusion matrices of binary results of the subtype predictor for TCGA training cohort, TCGA validation cohort, GSE30219, GSE31210, GSE50081, and GSE72094.</p>
</caption>
<graphic xlink:href="fcell-10-769711-g007.tif"/>
</fig>
</sec>
<sec id="s3-6">
<title>Epigenetic Differences Between C1 and C2</title>
<p>Recent studies have shown that the epigenetic alterations are associated with immune evasion and tumor phenotype (<xref ref-type="bibr" rid="B8">Dawson and Kouzarides, 2012</xref>). Hence, we performed somatic mutation and CNA (copy number alteration) analysis to explore the difference between C1 and C2. Patients in C1 tended to have a higher TMB (tumor mutation burden) as compared to those in C2 (<xref ref-type="fig" rid="F8">Figure&#x20;8C</xref>, Wilcoxon test, <italic>p</italic>&#x20;&#x3c; 0.001). The top 20 genes with the highest mutant frequency in each cluster are shown in <xref ref-type="fig" rid="F8">Figures 8A&#x2013;B</xref>, and there appeared to be little difference between C1 and C2. We further analyzed the mutation condition of known driver genes for LUAD and mutated genes enriched in C1. For the common driver genes in LUAD (including EGFR, ALK, ROS1, RET, MET, BRAF, KRAS, PIK3CA, and NRG1), only ROS1 had different proportion of mutation between C1 and C2 (<xref ref-type="fig" rid="F8">Figure&#x20;8D</xref>, <xref ref-type="sec" rid="s10">Supplementary Figure S7-8</xref>, <xref ref-type="sec" rid="s10">Supplementary Table S6</xref>). In addition, there were 11 representative mutated genes enriched in C1 (namely, TTN, PTPRB, FMN2, TP53, KCNB2, RYR3, CSMD3, SORCS1, PROX1, NELL1, and RYR2, <xref ref-type="fig" rid="F8">Figure&#x20;8E</xref>, <xref ref-type="sec" rid="s10">Supplementary Figure S9</xref>, <xref ref-type="sec" rid="s10">Supplementary Table S6</xref>). Afterward, we calculated and compared the CNA burden at the focal and arm level. Amplifications and deletions within chromosomal regions in each cluster were detected using GISTIC 2.0 (<xref ref-type="sec" rid="s10">Supplementary Figure S10</xref>). Patients in the C2 had a lower burden of gain or loss at the arm or focal level (<xref ref-type="fig" rid="F8">Figures 8F&#x2013;I</xref>, Wilcoxon test; focal-level gain burden: &#x3c;0.001; focal-level loss burden: &#x3c;0.001; arm-level gain burden: &#x3c;0.001; arm-level loss burden: &#x3c;0.001), which was consistent with the previous notion that copy number alteration was related to immunotherapy resistance (<xref ref-type="bibr" rid="B4">Bassaganyas et&#x20;al., 2020</xref>). All these underlying differences might be the cause of the different tumor phenotypes between C1 and C2. In addition, regarding the EGFR mutant, we found five types of mutations in these samples (Frame_shift_Del, In_Frame_Del, In_Frame_Ins, Missense_Mutation, and Nonsense_Mutation). Among these mutation types, most of them showed no difference between patients in C1 and C2 (<xref ref-type="sec" rid="s10">Supplementary Table S7</xref>, Frame_shift_Del, C1: 0%; C2: 0.43%. In_Frame_Ins, C1: 0%; C2: 1.30%. Missense_Mutation, C1: 10.06%; C2: 12.17%. Nonsense_Mutation, C1: 0%; C2: 0.43%). Notably, at a 90% confidence interval, the frequency of EGFR in-frame deletion (In_Frame_Del) was higher in patients in C2 than that in C1 (C1:1.89%; C2: 6.09%). Previous studies have suggested that NSCLC patients with EGFR mutations are not suitable for immunotherapy. Meanwhile, patients with EGFR mutation who benefited from anti-PD (L)1 have been reported in some case reports. In our study, patients in cluster 2 tend to be more likely to benefit from immunotherapy, which may be due to the MATH-based classification. However, more studies are desired to screen the beneficiary population.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Comparisons of somatic variations and copy number alteration burden between C1 and C2. <bold>(A&#x2013;B)</bold> Waterfall plots showed the top 20 mutated genes in C1 and C2. <bold>(C)</bold> Comparison of TMB between C1 and C2, and patients in C1 showed a higher TMB. <bold>(D)</bold> Mutation landscape of common driver genes of LUAD in C1 and C2. <bold>(E)</bold> Top 11 mutated genes enriched in patients in C1. <bold>(F&#x2013;I)</bold> Comparison of CNA burden at the focal or arm level between C1 and C2.</p>
</caption>
<graphic xlink:href="fcell-10-769711-g008.tif"/>
</fig>
<p>Then, we compared the expression of driver genes in different immune cells (B&#x20;cells, CD4&#x2b;T&#x20;cells, CD8&#x2b;T&#x20;cells, DCs, and macrophages) between anti-PD1 responders and non-responders (treated with pembrolizumab or cemiplimab) in scRNA-seq data (GSE123813 cohort). The result showed that the responder B&#x20;cells had a higher expression of BRAF and a lower expression of KRAS than the non-responders. Moreover, the expression of KRAS and PIK3CA in CD4&#x2b;T&#x20;cells was lower than that in the non-responders (<xref ref-type="sec" rid="s10">Supplementary Table S8</xref>, <xref ref-type="sec" rid="s10">Supplementary Figure&#x20;S11</xref>).</p>
</sec>
<sec id="s3-7">
<title>Identification of Potential Drugs for Patients in C1</title>
<p>Two drug sensitivity profiles were generated after preprocessing the AUC files of CTRP and PRISM databases. Then, a ridge regression model was used (&#x201c;pRRophetic&#x201d; package in R) to predict the drug sensitivity of each sample in TCGA cohort (N &#x3d; 389). For every sample, we obtained the AUC values of each compound contained in a certain database (CTRP or PRISM). Prior to further analysis, we attempted to demonstrate the reliability of drug sensitivity data. Patients in TCGA cohorts were assigned into two groups according to their EGFR alteration. We observed that patients with EGFR alteration showed lower AUC values of Gefitini than those without alteration both in CTRP and PRISM (<xref ref-type="fig" rid="F9">Figures 9A&#x2013;B</xref>), which was consistent with the clinical effect of Gefitini. Next, we identified the compounds (<xref ref-type="fig" rid="F9">Figures 9C&#x2013;D</xref>) with lower AUC values in C1 (log2FC &#x3e; 0.2, <italic>p</italic>-value&#x3c;0.05, <xref ref-type="sec" rid="s10">Supplementary Table S9-10</xref>), including three PRISM-derived compounds (vincristine, gemcitabine, and cabazitaxel) and seven CTRP-derived compounds (vincristine, SB-743921, paclitaxel, leptomycin B, KX2-391, GSK461364, and BI-2536). These nine compounds all had lower AUC values in C1, indicating that patients in C1 had increased sensitivity to the corresponding treatment and might serve as the candidate potential therapeutic drug for patients in&#x20;C1.</p>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Identification of a potential agent with higher sensitivity for patients in C1. <bold>(A&#x2013;B)</bold> Comparison of predicted Gefitini sensitivity between EGFR altered and unaltered groups. <bold>(C)</bold> Results of drug sensitivity analysis of three PRISM-derived compounds (vincristine, gemcitabine, and cabazitaxel). <bold>(D)</bold> Results of drug sensitivity analysis of seven CTRP-derived compounds (vincristine, SB-743921, paclitaxel, leptomycin B, KX2-391, GSK461364, and BI-2536). <bold>(E)</bold> CMap score of three candidate compounds (BI-2536, gemcitabine, and vincristine). <bold>(F&#x2013;H)</bold> Comparison of estimated IC<sub>50</sub> for BI-2536, gemcitabine, and paclitaxel in C1 and C2.</p>
</caption>
<graphic xlink:href="fcell-10-769711-g009.tif"/>
</fig>
<p>To explore the most reliable therapeutic compounds, we queried CMap (connectivity map) and GDSC (the Genomics of Drug Sensitivity in Cancer) and performed drug sensitivity analysis. As shown in the figure (<xref ref-type="fig" rid="F9">Figure&#x20;9E</xref>), among candidate compounds identified before, BI-2536 and gemcitabine showed relatively low CMap scores (Fig, BI-2536: 80.96; gemcitabine: 96.23), indicating therapeutic potential; and among three compounds in GDSC overlapped in the candidate drugs, only BI-2536 showed a lower estimated IC<sub>50</sub> in patients in C1 than that in C2 (<xref ref-type="fig" rid="F9">Figure&#x20;9F</xref>-H, Wilcoxon test, <italic>p</italic>-value, BI-2536: 0.0014; gemcitabine: 0.3200; paclitaxel: 0.4130). The abovementioned results indicated that BI-2536 might be the promising potential treatment compound in patients in C1. The potential mechanism may be due to higher expression of PLK1 in the C1 cluster (<xref ref-type="sec" rid="s10">Supplementary Table&#x20;S11</xref>).</p>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>Intratumor heterogeneity (ITH) is a common phenomenon existing in all kinds of tumors (<xref ref-type="bibr" rid="B1">Andor et&#x20;al., 2016</xref>). According to previous studies, increased ITH is correlated with poor clinical outcomes and has a negative association with immune infiltration (<xref ref-type="bibr" rid="B11">Hua et&#x20;al., 2020</xref>). Besides, ITH has been reported to have an inverse association with T-cell immunoreactivity and sensitivity to immune checkpoint blockade (<xref ref-type="bibr" rid="B22">McGranahan et&#x20;al., 2016</xref>). Thus, the analysis of ITH may create a new approach for cancer treatment. In our early-stage LUAD cohort, we used MATH as a measure of ITH quantification. We utilized TIMER and ESTIMATE algorithms to infer the immune infiltration pattern, and MATH was found to have negative correlation with the abundance of immune cells (including B&#x20;cell, CD4 T&#x20;cell, CD8 T&#x20;cell, dendritic cell, macrophage, and neutrophils). Patients with high MATH tend to have a poor overall survival outcome. Also, by using the OCLR algorithm, we calculated the stemness indexes for each patient, and a positive correlation was found between MATH and cancer stemness. These results are consistent with those of previous studies (<xref ref-type="bibr" rid="B24">Miranda et&#x20;al., 2019</xref>). In order to explore the ITH at a deeper level, an unsupervised consensus clustering was performed based on expression profiles of MATH-related DEGs. Early-stage LUAD patients in the main cohort had been classified into two groups (C1 and C2), and these two groups showed distinct characteristics. Specifically, patients in C2 had a lower MATH score than those in C1, indicating patients in C1 had higher ITH, while C1 had lower abundance of B&#x20;cell, CD4 T&#x20;cell, CD8 T&#x20;cell, macrophage, dendritic cell, and neutrophil. To predict the likelihood of immunotherapy response in patients in C1 and C2, we compared the expression profiles of PD1/PDL1/PDL2 and CTLA-4/CD80/CD86 between C1 and C2, and three immunotherapy-related signatures were calculated using ssGSEA. The result revealed that patients in C2 had higher expression of immune checkpoint molecules and higher enrichment of immunotherapy-related signatures, indicating that patients in C2 were more likely to benefit from immunotherapy, while patients in C1 had the opposite. We further used the TIDE algorithm to predict the immunotherapy response, and it showed a consistent outcome. In addition, we observed the distinct clinical overall survival outcome between C1 and C2 across the main cohort and four independent validation cohorts (GSE30219, GSE31210, GSE50081, and GSE72094). Patients in C2 had an apparent survival advantage compared to patients in C1. In the end, drug analysis was conducted to find the potential treatment for high ITH patients (patients in C1). The results revealed that BI-2536 might have therapeutic potential for patients in&#x20;C1.</p>
<p>In the current study, we have established two models using multiple machine learning algorithms (combined SVM-RFE, ElasticNet, XGBoost, and RFB): the early-stage LUAD diagnosis model and the early-stage LUAD classification predictor. For the former, the five-gene&#x2013;based prognosis model (including B3GNT3, PLEK2, GALNT7, GRK5, and SLC39A8) reached an AUC of 0.982 in the internal validation cohort and AUC of 0.817 and 0.850 in the two external validation cohorts. B3GNT3 is an important member of B3GlcNacT family, and it was found important in the development of lung cancer (<xref ref-type="bibr" rid="B32">Sun et&#x20;al., 2020</xref>). In addition, PLEK2 and GALNT7 have been reported to function as oncogenes in gall bladder cancer and colorectal cancer, respectively (<xref ref-type="bibr" rid="B16">Li et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B29">Shen H et&#x20;al., 2019</xref>). The coefficients of these three molecules in our prognosis model are positive, which refers to cancerous tissue prediction, indicating that they might play important roles in the development of lung adenocarcinoma. Indeed, there are many studies on the prognostic model for early-stage LUAD. Generally, these models were based on the prognosis of LUAD patients. In our study, we explored the MATH-based LUAD subtypes and built a classification model. Compared with previous studies, (e.g., Lu et&#x20;al. <italic>A Prognostic Model for overall survival of patients with early-stage non&#x2013;small cell lung cancer: a multicentre, retrospective study The Lancet digital health</italic>; and Krzystanek et&#x20;al. <italic>A robust prognostic gene expression signature for early-stage lung adenocarcinoma. Biomarker Research</italic>) (<xref ref-type="bibr" rid="B14">Krzystanek et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B20">Lu et&#x20;al., 2020</xref>), there are some advantages and disadvantages of our research. For example, in the study by Lu et&#x20;al., more omics data were included (eg. H&#x26;E&#x2013;stained histology images, pathological parameters), which made the results more reliable. Moreover, these two research studies both used relatively large cohorts (Lu et&#x20;alm multicenter, N &#x3d; 1,057, Krzystanek et&#x20;al., seven cohorts). In spite of these shortcomings, our study has some advantages. It is the first classification of early-stage LUAD based on MATH. We developed the classifier using current high-performance machine learning algorithms and verified its generalization ability. We tried to generate a small panel to help make a quick diagnosis and classification of LUAD at an early stage. However, its clinical translation value and application need further research. For the 21-gene&#x2013;based classification model, we used several indices, such as accuracy, precision, recall, and F1 score, to measure the performance of our model across the internal validation cohort and four independent validation cohorts, and the result revealed its good predictive ability. It reached AUCs of 0.94, 0.91, 0.90, 0.86, and 0.90 in the internal validation cohort and independent validation cohorts (GSE30219, GSE31210, GSE50081, and GSE72094). Notably, the false-positive rate and the false-negative rate of our model were 4.29% and 8.51% in the internal validation cohort, 9.10% and 10.00% in GSE30219, 6.00% and 13.33% in GSE31210, 4.69% and 23.80% in GSE50081, and 2.56% and 18.00% in GSE72094, respectively indicating good generalization ability and application value. The main advantage of our model lies in its simplicity: a small gene panel could be designed for the detection and classification of early-stage LUAD. From this, we could get quick information about the feasibility of developing LUAD and which classification it belongs to. Since the two clusters of early-stage LUAD have distinct characteristics and prognosis, the model could help clinicians make appropriate treatment decisions. Directly, the combination of these molecules (shown in <xref ref-type="fig" rid="F7">Figure&#x20;7B</xref>) could make a classification of NSCLC patients at an early stage. In our study, we elaborated on the clinical significance of this classification. In terms of individual molecules, most of them were studied in human cancers, including lung cancer (e.g., AQP1, AQP4, IL33, and PEBP4). For example, PEBP4 could promote the proliferation, migration, and EMT of lung cancer. Several studies suggested that aquaporin1 and aquaporin4 are related to the invasion of lung cancer. As for IL33, previous studies suggested that it could promote the occurrence and development of lung cancer. On the other hand, some studies suggested that it (IL33) could activate NK and CD8&#x2b;T&#x20;cells to suppress lung cancer. In general, these &#x201c;candidate genes&#x201d; could affect the biological function of lung cancer and further influence cancer phenotypes. In terms of clinical application, the combination of these genes is more meaningful. However, its clinical translation value and application need further research.</p>
<p>In conclusion, our study provided a new strategy for clinicians to make a quick preliminary assisting diagnosis of early-stage LUAD and make a patient classification at the intratumor heterogeneity level. Yet, this study has some unavoidable limitations and shortcomings. We found that patients in C1 exhibited a higher TMB and copy number burden and were enriched in certain mutations (such as TP53). However, we only depicted these characteristics in these involved clusters, and the correlation analysis did not reveal strong correlations. The causality was hard to be confirmed since our study is a retrospective analysis. The comparison of driver genes in immune cells between immunotherapy responders and non-responders was based on the sc-RNA seq dataset (GSE123813). Experimental validation needs to be further studied. In addition, though we used multiple cohorts to ensure the generalization ability of our findings, large sample clinical trials are needed to further confirm the clinical application&#x20;value.</p>
</sec>
</body>
<back>
<sec id="s5">
<title>Data Availability Statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found in the article/<xref ref-type="sec" rid="s10">Supplementary Material</xref>.</p>
</sec>
<sec id="s6">
<title>Author Contributions</title>
<p>LL and LC conceived the study. LC and TC acquired and analyzed data. ZY, HY, LJ, and YQ participated in interpreting the data. LC and GF drafted the manuscript. LC, TC, and HY participated in preparing the figures. All authors reviewed and revised this study and gave their final approval of the submitted manuscript.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>This study was supported by the National Key R&#x26;D Program of China (Grant No.2016YFC1303800) and the National Natural Science Foundation of China (Grant Nos. 81773056 and 82073179).</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors, and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fcell.2022.769711/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fcell.2022.769711/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table2.XLSX" id="SM1" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table1.DOCX" id="SM2" mimetype="application/DOCX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet1.PDF" id="SM3" mimetype="application/PDF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Andor</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Graham</surname>
<given-names>T. A.</given-names>
</name>
<name>
<surname>Jansen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Xia</surname>
<given-names>L. C.</given-names>
</name>
<name>
<surname>Aktipis</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Petritsch</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Pan-cancer Analysis of the Extent and Consequences of Intratumor Heterogeneity</article-title>. <source>Nat. Med.</source> <volume>22</volume> (<issue>1</issue>), <fpage>105</fpage>&#x2013;<lpage>113</lpage>. <pub-id pub-id-type="doi">10.1038/nm.3984</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ayers</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lunceford</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Nebozhyn</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Murphy</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Loboda</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Kaufman</surname>
<given-names>D. R.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>IFN-&#x3b3;-related mRNA Profile Predicts Clinical Response to PD-1 Blockade</article-title>. <source>J.&#x20;Clin. Invest.</source> <volume>127</volume> (<issue>8</issue>), <fpage>2930</fpage>&#x2013;<lpage>2940</lpage>. <pub-id pub-id-type="doi">10.1172/JCI91190</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baba</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Uramoto</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Takenaka</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Oka</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Shigematsu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Shimokawa</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>The Tumour Shape of Lung Adenocarcinoma Is Related to the Postoperative Prognosis</article-title>. <source>Interact. Cardiovasc. Thorac. Surg.</source> <volume>15</volume> (<issue>1</issue>), <fpage>73</fpage>&#x2013;<lpage>76</lpage>. <pub-id pub-id-type="doi">10.1093/icvts/ivs055</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bassaganyas</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Pinyol</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Esteban-Fabr&#xf3;</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Torrens</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Torrecilla</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Willoughby</surname>
<given-names>C. E.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Copy-Number Alteration Burden Differentially Impacts Immune Profiles and Molecular Features of Hepatocellular Carcinoma</article-title>. <source>Clin. Cancer Res.</source> <volume>26</volume> (<issue>23</issue>), <fpage>6350</fpage>&#x2013;<lpage>6361</lpage>. <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-20-1497</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bray</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ferlay</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Soerjomataram</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Siegel</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>Torre</surname>
<given-names>L. A.</given-names>
</name>
<name>
<surname>Jemal</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Global Cancer Statistics 2018: GLOBOCAN Estimates of Incidence and Mortality Worldwide for 36 Cancers in 185 Countries</article-title>. <source>CA Cancer J.&#x20;Clin.</source> <volume>68</volume> (<issue>6</issue>), <fpage>394</fpage>&#x2013;<lpage>424</lpage>. <pub-id pub-id-type="doi">10.3322/caac.21492</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cho</surname>
<given-names>J.-W.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>M. H.</given-names>
</name>
<name>
<surname>Ha</surname>
<given-names>S.-J.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>Y.-J.</given-names>
</name>
<name>
<surname>Cho</surname>
<given-names>B. C.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>I.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Genome-wide Identification of Differentially Methylated Promoters and Enhancers Associated with Response to Anti-PD-1 Therapy in Non-small Cell Lung Cancer</article-title>. <source>Exp. Mol. Med.</source> <volume>52</volume> (<issue>9</issue>), <fpage>1550</fpage>&#x2013;<lpage>1563</lpage>. <pub-id pub-id-type="doi">10.1038/s12276-020-00493-8</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Corsello</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Nagari</surname>
<given-names>R. T.</given-names>
</name>
<name>
<surname>Spangler</surname>
<given-names>R. D.</given-names>
</name>
<name>
<surname>Rossen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kocak</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bryan</surname>
<given-names>J.&#x20;G.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Discovering the Anticancer Potential of Non-oncology Drugs by Systematic Viability Profiling</article-title>. <source>Nat. Cancer</source> <volume>1</volume> (<issue>2</issue>), <fpage>235</fpage>&#x2013;<lpage>248</lpage>. <pub-id pub-id-type="doi">10.1038/s43018-019-0018-6</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dawson</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Kouzarides</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Cancer Epigenetics: from Mechanism to Therapy</article-title>. <source>Cell</source> <volume>150</volume> (<issue>1</issue>), <fpage>12</fpage>&#x2013;<lpage>27</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2012.06.013</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Duma</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Santana-Davila</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Molina</surname>
<given-names>J.&#x20;R.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Non-Small Cell Lung Cancer: Epidemiology, Screening, Diagnosis, and Treatment</article-title>. <source>Mayo Clinic Proc.</source> <volume>94</volume> (<issue>8</issue>), <fpage>1623</fpage>&#x2013;<lpage>1640</lpage>. <pub-id pub-id-type="doi">10.1016/j.mayocp.2019.01.013</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Identification of Gene Signatures for Diagnosis and Prognosis of Hepatocellular Carcinomas Patients at Early Stage</article-title>. <source>Front. Genet.</source> <volume>11</volume>, <fpage>11 857</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2020.00857</pub-id> </citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hua</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Pesatori</surname>
<given-names>A. C.</given-names>
</name>
<name>
<surname>Consonni</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Caporaso</surname>
<given-names>N. E.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Genetic and Epigenetic Intratumor Heterogeneity Impacts Prognosis of Lung Adenocarcinoma</article-title>. <source>Nat. Commun.</source> <volume>11</volume> (<issue>1</issue>), <fpage>2459</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-020-16295-5</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hubble</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Demeter</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Mao</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Nitzberg</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Reddy</surname>
<given-names>T. B. K.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>Implementation of GenePattern within the Stanford Microarray Database</article-title>. <source>Nucleic Acids Res.</source> <volume>37</volume> (<issue>Database issue</issue>), <fpage>D898</fpage>&#x2013;<lpage>D901</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkn786</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sahu</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Signatures of T&#x20;Cell Dysfunction and Exclusion Predict Cancer Immunotherapy Response</article-title>. <source>Nat. Med.</source> <volume>24</volume> (<issue>10</issue>), <fpage>1550</fpage>&#x2013;<lpage>1558</lpage>. <pub-id pub-id-type="doi">10.1038/s41591-018-0136-1</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Krzystanek</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Moldvay</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sz&#xfc;ts</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Szallasi</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Eklund</surname>
<given-names>A. C.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>A Robust Prognostic Gene Expression Signature for Early Stage Lung Adenocarcinoma</article-title>. <source>Biomark Res.</source> <volume>4</volume>, <fpage>4</fpage>. <pub-id pub-id-type="doi">10.1186/s40364-016-0058-3</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Prognostic Impact of Programed Cell Death-1 (PD-1) and PD-Ligand 1 (PD-L1) Expression in Cancer Cells and Tumor Infiltrating Lymphocytes in Colorectal Cancer</article-title>. <source>Mol. Cancer</source> <volume>15</volume> (<issue>1</issue>), <fpage>55</fpage>. <pub-id pub-id-type="doi">10.1186/s12943-016-0539-x</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zeng</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Shan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>B.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Long Non-coding RNA-SNHG7 Acts as a Target of miR-34a to Increase GALNT7 Level and Regulate PI3K/Akt/mTOR Pathway in Colorectal Cancer Progression</article-title>. <source>J.&#x20;Hematol. Oncol.</source> <volume>11</volume> (<issue>1</issue>), <fpage>89</fpage>. <pub-id pub-id-type="doi">10.1186/s13045-018-0632-2</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zeng</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Cohen</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Q.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>TIMER2.0 for Analysis of Tumor-Infiltrating Immune Cells</article-title>. <source>Nucleic Acids Res.</source> <volume>48</volume> (<issue>W1</issue>), <fpage>W509</fpage>&#x2013;<lpage>W514</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkaa407</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Cui</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Qu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Chater</surname>
<given-names>J.&#x20;M.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Extended Application of Genomic Selection to Screen Multiomics Data for Prognostic Signatures of Prostate Cancer</article-title>. <source>Brief Bioinform</source> <volume>22</volume> (<issue>3</issue>), <fpage>bbaa197</fpage>. <pub-id pub-id-type="doi">10.1093/bib/bbaa197</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lian</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>Y. P.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y. C.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Q. F.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Integrative Analysis of Gene Expression and DNA Methylation through One&#x2010;class Logistic Regression Machine Learning Identifies Stemness Features in Medulloblastoma</article-title>. <source>Mol. Oncol.</source> <volume>13</volume> (<issue>10</issue>), <fpage>2227</fpage>&#x2013;<lpage>2245</lpage>. <pub-id pub-id-type="doi">10.1002/1878-0261.12557</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Bera</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Prasanna</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Janowczyk</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>A Prognostic Model for Overall Survival of Patients with Early-Stage Non-small Cell Lung Cancer: a Multicentre, Retrospective Study</article-title>. <source>Lancet Digital Health</source> <volume>2</volume> (<issue>11</issue>), <fpage>e594</fpage>&#x2013;<lpage>e606</lpage>. <pub-id pub-id-type="doi">10.1016/s2589-7500(20)30225-9</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McDonald</surname>
<given-names>K.-A.</given-names>
</name>
<name>
<surname>Kawaguchi</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Qi</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Peng</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Asaoka</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Young</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Tumor Heterogeneity Correlates with Less Immune Response and Worse Survival in Breast Cancer Patients</article-title>. <source>Ann. Surg. Oncol.</source> <volume>26</volume> (<issue>7</issue>), <fpage>2191</fpage>&#x2013;<lpage>2199</lpage>. <pub-id pub-id-type="doi">10.1245/s10434-019-07338-3</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McGranahan</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Furness</surname>
<given-names>A. J.&#x20;S.</given-names>
</name>
<name>
<surname>Rosenthal</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Ramskov</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Lyngaa</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Saini</surname>
<given-names>S. K.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Clonal Neoantigens Elicit T&#x20;Cell Immunoreactivity and Sensitivity to Immune Checkpoint Blockade</article-title>. <source>Science</source> <volume>351</volume> (<issue>6280</issue>), <fpage>1463</fpage>&#x2013;<lpage>1469</lpage>. <pub-id pub-id-type="doi">10.1126/science.aaf1490</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Messina</surname>
<given-names>J.&#x20;L.</given-names>
</name>
<name>
<surname>Fenstermacher</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Eschrich</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Qu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Berglund</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Lloyd</surname>
<given-names>M. C.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>12-Chemokine Gene Signature Identifies Lymph Node-like Structures in Melanoma: Potential for Patient Selection for Immunotherapy?</article-title> <source>Sci. Rep.</source> <volume>2</volume>, <fpage>2 765</fpage>. <pub-id pub-id-type="doi">10.1038/srep00765</pub-id> </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Miranda</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hamilton</surname>
<given-names>P. T.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>A. W.</given-names>
</name>
<name>
<surname>Pattnaik</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Becht</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Mezheyeuski</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Cancer Stemness, Intratumoral Heterogeneity, and Immune Response across Cancers</article-title>. <source>Proc. Natl. Acad. Sci. USA</source> <volume>116</volume> (<issue>18</issue>), <fpage>9020</fpage>&#x2013;<lpage>9029</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1818210116</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Musa</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ghoraie</surname>
<given-names>L. S.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>S.-D.</given-names>
</name>
<name>
<surname>Galzko</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Yli-Harja</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Dehmer</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>A Review of Connectivity Map and Computational Approaches in Pharmacogenomics</article-title>. <source>Brief Bioinform</source> <volume>19</volume> (<issue>3</issue>), <fpage>bbw112</fpage>&#x2013;<lpage>23</lpage>. <pub-id pub-id-type="doi">10.1093/bib/bbw112</pub-id> </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ran</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Teng</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Low Intratumor Heterogeneity Correlates with Increased Response to PD-1 Blockade in Renal Cell Carcinoma</article-title>. <source>Ther. Adv. Med. Oncol.</source> <volume>12</volume>, <fpage>1758835920977117</fpage>. <pub-id pub-id-type="doi">10.1177/1758835920977117</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rees</surname>
<given-names>M. G.</given-names>
</name>
<name>
<surname>Seashore-Ludlow</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Cheah</surname>
<given-names>J.&#x20;H.</given-names>
</name>
<name>
<surname>Adams</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Price</surname>
<given-names>E. V.</given-names>
</name>
<name>
<surname>Gill</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Correlating Chemical Sensitivity and Basal Gene Expression Reveals Mechanism of Action</article-title>. <source>Nat. Chem. Biol.</source> <volume>12</volume> (<issue>2</issue>), <fpage>109</fpage>&#x2013;<lpage>116</lpage>. <pub-id pub-id-type="doi">10.1038/nchembio.1986</pub-id> </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rocco</surname>
<given-names>J.&#x20;W.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Mutant Allele Tumor Heterogeneity (MATH) and Head and Neck Squamous Cell Carcinoma</article-title>. <source>Head Neck Pathol.</source> <volume>9</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>5</lpage>. <pub-id pub-id-type="doi">10.1007/s12105-015-0617-1</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shen H</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Zhan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>PLEK2 Promotes Gallbladder Cancer Invasion and Metastasis through EGFR/CCL2 Pathway</article-title>. <source>J.&#x20;Exp. Clin. Cancer Res.</source> <volume>38</volume> (<issue>1</issue>), <fpage>247</fpage>. <pub-id pub-id-type="doi">10.1186/s13046-019-1250-8</pub-id> </citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shen R</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Identification of Distinct Immune Subtypes in Colorectal Cancer Based on the Stromal Compartment</article-title>. <source>Front. Oncol.</source> <volume>9</volume>, <fpage>9 1497</fpage>. <pub-id pub-id-type="doi">10.3389/fonc.2019.01497</pub-id> </citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shroff</surname>
<given-names>G. S.</given-names>
</name>
<name>
<surname>de Groot</surname>
<given-names>P. M.</given-names>
</name>
<name>
<surname>Papadimitrakopoulou</surname>
<given-names>V. A.</given-names>
</name>
<name>
<surname>Truong</surname>
<given-names>M. T.</given-names>
</name>
<name>
<surname>Carter</surname>
<given-names>B. W.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Targeted Therapy and Immunotherapy in the Treatment of Non-small Cell Lung Cancer</article-title>. <source>Radiol. Clin. North Am.</source> <volume>56</volume> (<issue>3</issue>), <fpage>485</fpage>&#x2013;<lpage>495</lpage>. <pub-id pub-id-type="doi">10.1016/j.rcl.2018.01.012</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Xian</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>B3GNT3, a Direct Target of miR-149-5p, Promotes Lung Cancer Development and Indicates Poor Prognosis of Lung Cancer</article-title>. <source>Cancer Manag. Res.</source> <volume>12</volume>, <fpage>2381</fpage>&#x2013;<lpage>2391</lpage>. <pub-id pub-id-type="doi">10.2147/CMAR.S236565</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thorsson</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Gibbs</surname>
<given-names>D. L.</given-names>
</name>
<name>
<surname>Brown</surname>
<given-names>S. D.</given-names>
</name>
<name>
<surname>Wolf</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Bortone</surname>
<given-names>D. S.</given-names>
</name>
<name>
<surname>Ou Yang</surname>
<given-names>T. H.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>The Immune Landscape of Cancer</article-title>. <source>Immunity</source> <volume>48</volume> (<issue>4</issue>), <fpage>812</fpage>. <pub-id pub-id-type="doi">10.1016/j.immuni.2018.03.023</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X.-S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Antigen Presentation and Tumor Immunogenicity in Cancer Immunotherapy Response Prediction</article-title>. <source>Elife</source> <volume>8</volume>, <fpage>e49020</fpage>. <pub-id pub-id-type="doi">10.7554/eLife.49020</pub-id> </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Xing</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Machine Learning Revealed Stemness Features and a Novel Stemness-Based Classification with Appealing Implications in Discriminating the Prognosis, Immunotherapy and Temozolomide Responses of 906 Glioblastoma Patients</article-title>. <source>Brief Bioinform</source> <volume>22</volume>, <fpage>bbab032</fpage>. <pub-id pub-id-type="doi">10.1093/bib/bbab032</pub-id> </citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Soares</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Greninger</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Edelman</surname>
<given-names>E. J.</given-names>
</name>
<name>
<surname>Lightfoot</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Forbes</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Genomics of Drug Sensitivity in Cancer (GDSC): a Resource for Therapeutic Biomarker Discovery in Cancer Cells</article-title>. <source>Nucleic Acids Res.</source> <volume>41</volume> (<issue>Database issue</issue>), <fpage>D955</fpage>&#x2013;<lpage>D961</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gks1111</pub-id> </citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hsu</surname>
<given-names>P. J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.-S.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.-G.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Dynamic Transcriptomic m6A Decoration: Writers, Erasers, Readers and Functions in RNA Metabolism</article-title>. <source>Cell Res.</source> <volume>28</volume> (<issue>6</issue>), <fpage>616</fpage>&#x2013;<lpage>624</lpage>. <pub-id pub-id-type="doi">10.1038/s41422-018-0040-8</pub-id> </citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yoshihara</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Shahmoradgoli</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mart&#xed;nez</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Vegesna</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Torres-Garcia</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Inferring Tumour Purity and Stromal and Immune Cell Admixture from Expression Data</article-title>. <source>Nat. Commun.</source> <volume>4</volume>, <fpage>4 2612</fpage>. <pub-id pub-id-type="doi">10.1038/ncomms3612</pub-id> </citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zappa</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Mousa</surname>
<given-names>S. A.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Non-small Cell Lung Cancer: Current Treatment and Future Advances</article-title>. <source>Transl. Lung Cancer Res.</source> <volume>5</volume> (<issue>3</issue>), <fpage>288</fpage>&#x2013;<lpage>300</lpage>. <pub-id pub-id-type="doi">10.21037/tlcr.2016.06.07</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>