<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Oncol.</journal-id>
<journal-title>Frontiers in Oncology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Oncol.</abbrev-journal-title>
<issn pub-type="epub">2234-943X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fonc.2023.1130092</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Oncology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Integration of multi-omics data reveals a novel hybrid breast cancer subtype and its biomarkers</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Zhen-zhen</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1361679"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Xu-hua</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2149231"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wen</surname>
<given-names>Xiao-ling</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2139014"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Na</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1760340"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Guo</surname>
<given-names>Yu</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhu</surname>
<given-names>Xu</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Fu</surname>
<given-names>Shu-heng</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Xiong</surname>
<given-names>Fei-fan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Bai</surname>
<given-names>Jing</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Gao</surname>
<given-names>Xiao-ling</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Wang</surname>
<given-names>Hong-jiu</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Key Laboratory of Tropical Translational Medicine of Ministry of Education, College of Biomedical Information and Engineering, Hainan Medical University</institution>, <addr-line>Haikou</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>The Medical Laboratory Center, Hainan General Hospital</institution>, <addr-line>Haikou</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>College of Bioinformatics Science and Technology, Harbin Medical University</institution>, <addr-line>Harbin</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Maria Rosaria De Miglio, University of Sassari, Italy</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Matteo Massidda, University of Sassari, Italy; Andrea Angius, Department of Biomedical Sciences (CNR), Italy</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Hong-jiu Wang, <email xlink:href="mailto:wanghongjiu@hainmc.edu.cn">wanghongjiu@hainmc.edu.cn</email>; Xiao-ling Gao, <email xlink:href="mailto:gaoxl008@hotmail.com">gaoxl008@hotmail.com</email>; Jing Bai, <email xlink:href="mailto:593003960@qq.com">593003960@qq.com</email>
</p>
</fn>
<fn fn-type="equal" id="fn003">
<p>&#x2020;These authors have contributed equally to this work and share first authorship</p>
</fn>
<fn fn-type="other" id="fn002">
<p>This article was submitted to Breast Cancer, a section of the journal Frontiers in Oncology</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>21</day>
<month>03</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>13</volume>
<elocation-id>1130092</elocation-id>
<history>
<date date-type="received">
<day>23</day>
<month>12</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>06</day>
<month>03</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Wang, Li, Wen, Wang, Guo, Zhu, Fu, Xiong, Bai, Gao and Wang</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Wang, Li, Wen, Wang, Guo, Zhu, Fu, Xiong, Bai, Gao and Wang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Tumor heterogeneity in breast cancer hinders proper diagnosis and treatment, and the identification of molecular subtypes may help enhance the understanding of its heterogeneity. Therefore, we proposed a novel integrated multi-omics approach for breast cancer typing, which led to the identification of a hybrid subtype (Mix_Sub subtype) with a poor survival prognosis. This subtype is characterized by lower levels of the inflammatory response, lower tumor malignancy, lower immune cell infiltration, and higher T-cell dysfunction. Moreover, we found that cell-cell communication mediated by NCAM1-FGFR1 ligand-receptor interaction and cellular functional states, such as cell cycle, DNA damage, and DNA repair, were significantly altered and upregulated in patients with this subtype, and that such patients displayed greater sensitivity to targeted therapies. Subsequently, using differential genes among subtypes as biomarkers, we constructed prognostic risk models and subtype classifiers for the Mix_Sub subtype and validated their generalization ability in external datasets obtained from the GEO database, indicating their potential therapeutic and prognostic significance. These biomarkers also showed significant spatially variable expression in malignant tumor cells. Collectively, the identification of the Mix_Sub breast cancer subtype and its biomarkers, based on the driving relationship between omics, has deepened our understanding of breast cancer heterogeneity and facilitated the development of breast cancer precision therapy.</p>
</abstract>
<kwd-group>
<kwd>breast cancer</kwd>
<kwd>multi-omics</kwd>
<kwd>molecular subtypes</kwd>
<kwd>biomolecular markers</kwd>
<kwd>spatial variability</kwd>
</kwd-group>
<counts>
<fig-count count="10"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="45"/>
<page-count count="16"/>
<word-count count="7170"/>
</counts>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Breast cancer is the most common malignancy with highly heterogeneous and has the second highest mortality rate among female tumors worldwide (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B2">2</xref>). The identification of novel molecular subtypes could help in the accurate diagnosis and personalized treatment of breast cancer (<xref ref-type="bibr" rid="B2">2</xref>, <xref ref-type="bibr" rid="B3">3</xref>).</p>
<p>Thus far, PAM50 intrinsic breast cancer subtypes, luminal A (LumA), luminal B (LumB), basal-like (Basal), HER2 over-expressed (HER2), and normal-like (<xref ref-type="bibr" rid="B4">4</xref>), which are categorized based on the mRNA expression profile of 50 genes, have received the most attention from BRCA experts, but this classification system was derived based on single-omics only. Therefore, some studies that reclassify breast cancer based on other single-omics data types have also deepened the understanding of breast cancer heterogeneity. For example, by effectively combining gene mutation profiles with unsupervised machine methods, three subtypes closely related to clinical information were identified, and effective classification models were developed, providing a new perspective for understanding cancer subtyping studies (<xref ref-type="bibr" rid="B5">5</xref>). Using a copy number variation (CNV) dataset, Andre et&#xa0;al. classified breast cancers into three subtypes associated with copy number abnormalities and identified a large number of previously unidentified regions of DNA copy number variation and identified potential therapeutic targets (<xref ref-type="bibr" rid="B6">6</xref>). Six molecular subtypes of breast cancer with distinct miRNA profiles were revealed based on miRNA expression profiles, illustrating that subtle differences in miRNAs among cancer subtypes can be used to differentiate subtypes and deepen the understanding of cancer heterogeneity (<xref ref-type="bibr" rid="B7">7</xref>). In short, the widespread use of various high-throughput omics data has identified breast cancer subtypes with specific molecular mechanisms and expanded the study of breast cancer typing, but the information provided by single-omics data is one-sided (<xref ref-type="bibr" rid="B8">8</xref>).</p>
<p>In recent years, the growing availability of multi-omics data, including genome and transcriptome, has led to unprecedented insight and resolution of cancer subtypes. The combination of multi-omics data allows a higher resolution of breast cancer subtypes (<xref ref-type="bibr" rid="B9">9</xref>). Several studies have been conducted to stratify BRCA patients based on multi-omics data integration analysis. For instance, a comprehensive correlation analysis of copy number variation data and gene expression data from 997 primary breast cancer tumors identified new subgroups with different clinical outcomes, which was validated in an external dataset containing 995 primary breast cancer patients (<xref ref-type="bibr" rid="B10">10</xref>). Similarly, the correlation of these two omics was analyzed by a new algorithm in another study, which also revealed a potentially novel subtype of breast cancer (<xref ref-type="bibr" rid="B11">11</xref>). Moreover, unsupervised analysis of breast tumor samples using both expression and methylation (MET) profiles discovered two novel subtypes with distinct genetic and epigenetic patterns in the luminal-A subgroup (<xref ref-type="bibr" rid="B12">12</xref>). The correlativity between data from three omics layers (CNV, MET, and mRNA) were combined to stratify BRCA patients and two biologically distinct subgroups were determined (<xref ref-type="bibr" rid="B13">13</xref>). It is evident that the correlation between different omics has played a major role in the development of breast cancer subtypes, but there is still a need for more research to focus on the relationship between the genome and transcriptome and how it can be used for cancer typing.</p>
<p>Thus, we have proposed a novel method, called GDTEC (Genome-Driven Transcriptome), based on the driving relationship between genome and transcriptome (denoted as GDTEC) to identify breast cancer subtypes and a hybrid breast cancer subtype with extremely poor survival prognosis was identified from the TCGA-BRCA cohort. Differences in the clinical phenotype, tumor microenvironment, biological function, cell state, and cell-cell communication were identified for this subtype patients. Patients with the hybrid subtype were also found to be more mixed in histological classification and more sensitive to targeted therapy. Subsequently, we identified 31 biomarkers that were used to construct prognostic risk models and subtype classifiers for patients with the hybrid subtype at the multi-omics level and at the gene expression level with significant results. The generalization ability of these four prognostic risk models and subtype classifiers was validated in four external datasets obtained from the GEO database, indicating that these biomarkers have reliable therapeutic and prognostic significance for the hybrid subtype of breast cancer. See <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;5</bold>
</xref> for the workflow.</p>
<p>In conclusion, our study identified a new hybrid breast cancer subtype with extremely poor survival prognosis and its biomarkers, which provides a new reference for molecular typing studies and clinical precision treatment of breast cancer.</p>
</sec>
<sec id="s2" sec-type="results">
<label>2</label>
<title>Results</title>
<sec id="s2_1">
<label>2.1</label>
<title>GDTEC-based stratification of breast cancer</title>
<p>To reveal the heterogeneity of breast cancer patients and obtain robust clustering results. Three factors were considered: 1) The selection of different LFC thresholds. 2) A multi-level LFC-based score assignment. 3) Different clustering methods and distance measures. The results showed that the GDTEC matrix and clustering results were robust and consistent across different LFC thresholds (<xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1A, B</bold>
</xref>). The clustering results obtained after multi-level LFC-based score assignment were found to have no higher resolution (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1C</bold>
</xref>). It was found that approximately 93.2% of all the clustering results had an overlap ratio of 0.8 using different methods and measures (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1D</bold>
</xref>), and the clustering results were consistent and robust. Finally, we chose LFC &#x2208; (-1, 1) as the threshold to create a GDTEC fusion matrix containing 299 subtype-specific genes for 721 BRCA patients and used the R package &#x2018;ConsensusClusterPlus&#x2019; for molecular subtype identification. We found that k=4 was the inflection point for all results (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S1</bold>
</xref>). The clarity of the classification of the 23 clustering results at k=4 was observed and the results of the pam-binary were considered as the final result of clustering (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1E</bold>
</xref>), which proved that four breast cancer subtypes were identified based on the characteristics of GDTEC. Then, a significant difference in overall survival time (OS) was discovered among the patients of four subtypes by using Kaplan-Meier and log-rank test, with the patients of subtype 4 having a significantly worse overall survival than the patients of the other subtypes (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1E</bold>
</xref>, Log-rank, p = 0.0082). Hierarchical clustering of the 299 subtype-specific genes used for subtyping revealed that the signature genes were clearly clustered into four clusters and had different levels of GDTEC expression in the four breast cancer subtypes. Notably, almost all genes were characterized by GDTEC expression in subtype 4 with the poorest survival (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1F</bold>
</xref>). We also investigated the number of genes with GDTEC expression among 14,749 genes in patients with the four breast cancer subtypes and showed that the patients having the best survival prognosis in subtype 1 had fewer genes with GDTEC expression, while the patients with the poorest survival prognosis in subtype 4 had the most genes with GDTEC expression (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1G</bold>
</xref>). Therefore, we speculated that the poorer survival prognosis of patients may be related to the fact that they have a higher number of genes with GDTEC expression.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>
<bold>(A)</bold> The overlap of GDTEC matrices generated under different LFCs. <bold>(B)</bold> Overlap rate of patients in the clustering results obtained based on different LFCs. <bold>(C)</bold> Overlap of patients in the clustering results obtained based on multilevel LFC score assignment. <bold>(D)</bold> The coincidence rate of the patients among the clustering results. <bold>(E)</bold> Kaplan-Meier curves of the overall survival (OS) among the four subtypes in the TCGA cohort. <bold>(F)</bold> Hierarchical clustering heat map of 299 genes with GDTEC features (&#x2018;1&#x2019; indicates GDTEC expression, and &#x2018;0&#x2019; indicates no GDTEC expression). <bold>(G)</bold> The number of genes with GDTEC features in the four subtypes, out of 14,749 genes in the multi-omics fusion dataset.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1130092-g001.tif"/>
</fig>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>GDTEC-based subtypes show significant distinct phenotypic and clinical features</title>
<p>To reveal the differences in clinical phenotypes among these four subtypes of breast cancer patients, we calculated the percentage of PAM50 (Prediction Analysis of Microarray 50) classification in each subtype and found that subtype 1 was predominantly composed by Luminal A (88.60%), defined as the LumA-dominant subtype (denoted as Dom_A). Subtype 2 was predominantly composed of both Luminal A (65.60%), and Luminal B (18. 80%), defined as the LumA- and LumB-dominant subtype (denoted as Dom_A&amp;B). Subtype 3 was mainly Basal-like (53%), defined as the Basal-like dominant subtype (denoted as Dom_Basal). Subtype 4 with the worst prognosis is not easily classified as any of the known subtypes, but rather is a unique hybrid subtype, denoted as Mix_Sub, which contains a mixture of different subtypes, including 34.40% Luminal A, 38.40% Luminal B, 16% Her2, and 11.20% Basal-like (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2A</bold>
</xref>). Then, the Mix_Sub subtype was characterized by a more dispersed age distribution compared to other subtypes, as evidenced by the folded graphs of the age proportions of patients (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>). Additionally, an analysis of the expression levels of Her2, estrogen receptor (Er), and progesterone receptor (Pr) of breast cancer patients showed that the Mix_Sub subtype was also marked by confusion in hormone levels in comparison to the other subtypes (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2C</bold>
</xref>). Subsequently, we observed that patients with the Mix_Sub subtype received the expected treatment according to the distribution of PAM50 subtypes in this subtype (80% of patients received treatment: 20% received combination therapy, and 60% received monotherapy). However, their worst survival prognosis suggested that they may need to be treated with increased treatment modalities and given more attention at the time of treatment (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2D</bold>
</xref>). In conclusion, the above results suggested that the discovery of the Mix_Sub subtype could improve the reference information for clinicians in the diagnosis and treatment of breast cancer patients.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>
<bold>(A)</bold> The proportion of the existing PAM50 subtypes among the four breast cancer subtypes. <bold>(B)</bold> The distribution of the four breast cancer subtypes in different age ranges. <bold>(C)</bold> The status of Her2, Er, Pr in patients with four breast cancer subtypes. N means negative; P means positive. <bold>(D)</bold> The status of patients with four breast cancer subtypes received pharmaceutical or radiation therapy. YY means receiving two treatments; NN means not receiving any treatments; Monotherapy means receiving either of these two treatments.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1130092-g002.tif"/>
</fig>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Multiple biological functions associated with breast cancer are altered in the Mix_Sub subtype</title>
<p>Altered biological function plays an important role in the development and progression of cancer (<xref ref-type="bibr" rid="B14">14</xref>). Therefore, we performed Gene Ontology (GO) enrichment analysis of subtype-specific genes to investigate the altered biological processes in patients of each subtype with GDTEC expression using the &#x2018;ClusterProfiler&#x2019; package. It was found that patients with the Mix_Sub subtype exhibited significant alterations in a large number of biological processes (BPs), while the other three subtypes only showed partial alterations. The 97 significantly altered biological processes in patients with the four subtypes are shown in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3A</bold>
</xref>. We delved deeper into the biological changes that are unique to each subtype of breast cancer and the results indicated that patients with the Dom_A, Dom_A&amp;B, or Dom_Basal subtypes showed changes in biological processes that are crucial in the development of breast cancer. These processes include mammary gland epithelial cell proliferation and development, cell-cell adhesion, macrophage and glial cell proliferation, neuron cellular homeostasis, cell motility, migration, and differentiation, and regulation of ERK1 and ERK2 cascade (<xref ref-type="bibr" rid="B15">15</xref>&#x2013;<xref ref-type="bibr" rid="B17">17</xref>). Notably, all these biological processes were altered in patients with Mix_Sub subtype (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>). Overall, our analysis revealed that a large number of biological processes were altered in patients with the Mix_Sub subtype and the combined impact of these alterations could potentially be a significant contributor to the unfavorable survival prognosis observed in patients with the Mix_Sub subtype.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>
<bold>(A)</bold> Sankey diagram showing the relationship between the 97 significantly altered biological processes and patients with four subtypes. <bold>(B)</bold> Representative biological processes that are altered in patients with 4 breast cancer subtypes.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1130092-g003.tif"/>
</fig>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Mix_Sub subtype patients with complex tumor microenvironment are expected to be more suitable for targeted therapy</title>
<p>Tumor microenvironment (TME) is closely related to cancer prognosis and therapeutic efficacy (<xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B19">19</xref>). Consequently, we compared the differences in tumor microenvironment between patients with the Mix_Sub subtype and other subtypes. The results showed that patients with the Mix_Sub subtype had significantly lower immune cell infiltration, especially including B cells, dendritic cells, and endothelial cells, compared to other subtypes (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>, Kruskal-Wallis test, p = 0.00078, 0.0029, 2.4e-05). The immune signature scores also indicated a lower level of immune cell infiltration in patients with the Mix_Sub subtype (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref>). T cells are an important component of human immune function. Gene set variation analysis (GSVA) of 416 T cell disorders genes revealed higher T-cell dysfunction and lower T-cell elimination in patients with the Mix_Sub subtype, which explains the poorer immune response in patients with the Mix_Sub subtype from a perspective of T cells (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4C</bold>
</xref>). Moreover, the average expression of 154 T-cell inflammatory genes also indicated a lower inflammatory response in patients with this subtype (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4D</bold>
</xref>). The tumor stemness score index can be used to evaluate the malignancy of the tumor. We found that the tumor stemness score increased with decreasing survival in patients of each subtype, and the tumor stemness score of patients with the Mix_Sub subtype was only lower than that of patients with the Dom_Basal subtype (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4E</bold>
</xref>). Collectively, our results demonstrated that patients with the Mix_Sub subtype have higher T-cell disorders and lower immune cell infiltration, inflammatory response, and tumor malignancy, which may contribute to the worst survival rate in patients with this subtype.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>
<bold>(A)</bold> Immune infiltration level score based on the MCP-counter method (Kruskal-Wallis test, &#x2018;*&#x2019;p &lt; 0.05, &#x2018;**&#x2019;p &lt; 0.005, &#x2018;***&#x2019;p &lt; 0.0005, &#x2018;****&#x2019;p &lt; 0.00005).. <bold>(B)</bold> Immune signature scores, based on the Dom_A subtype, and relative scores of other subtypes. <bold>(C)</bold> GSVA enrichment scores for genes associated with T-cell disorders. <bold>(D)</bold> Expression of T-cell inflammatory genes. <bold>(E)</bold> Cancer stemness cell score.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1130092-g004.tif"/>
</fig>
<p>Next, we investigated the proportion of the 12 consensus groups in the histological classification of TCGA-BRCA proposed in the literature (<xref ref-type="bibr" rid="B20">20</xref>) across the four subtypes and found that the Mix_Sub subtype was mainly composed of five consensus groups homogeneously (32.70% IDC-LumB, 22.20% IDC-LumA, 15.30% IDC-Basal, 13.30% ILC-Luminal, 9.70% IDC-Her2E), while the other three subtypes consisted mainly of two or three consensus groups (Dom_A: 59.60% IDC-LumA and 21.90% ILC-Luminal, Dom-A&amp;B: 52.20% IDC-LumA and 17.20% IDC-LumB, Dom_Basal: 51.50% IDC-Basal, 14.40% IDC-Her2E and 10.30% IDC-LumB) (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5A</bold>
</xref>). This result indicated that the Mix_Sub subtype is confusing even from a histological point of view. Pathological sections of individual cases from these 12 consensus groups in the TCGA database are presented here (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>).</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>
<bold>(A)</bold> Distribution of the 12 consensus groups previously reported for TCGA-BRCA in 4 subtypes. <bold>(B)</bold> Pathological sections of 12 consensus groups classified according to a combination of molecular and histological features. <bold>(C)</bold> Mutation load of seven targeted therapeutic genes associated with breast cancer treatment from the literature (Wilcoxon-test, '***'p &lt; 0.005, '****'p &lt; 0.001). <bold>(D)</bold> Common mutations in 7 target genes. <bold>(E)</bold> Lines of the same color connect genes that are simultaneously mutated only in patients with the Mix_Sub subtype. <bold>(F)</bold> Drug susceptibility prediction for gene mutation (&#x2018;yes&#x2019; is the mutant group, &#x2018;no&#x2019; is the unmutated group). Student's t-test, '*'p &lt; 0.05, '***'p &lt; 0.005, '****'p &lt; 0.001</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1130092-g005.tif"/>
</fig>
<p>Recently, several breast cancer-targeted therapeutic genes have been identified in published studies (<xref ref-type="bibr" rid="B21">21</xref>&#x2013;<xref ref-type="bibr" rid="B23">23</xref>). We found that genomic variation in these genes increased with decreasing survival in patients with subtypes, being highest in patients with Mix_Sub subtype (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5C</bold>
</xref>, EGFR: 12.46% ~ ERBB2: 31.65%). Particularly, the highest percentage of patients with simultaneous genomic variants in at least two genes was observed in patients with the Mix_Sub subtype (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5D</bold>
</xref>). Moreover, some combinations of these genes showed concurrent genomic variants only in patients of this subtype (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5E</bold>
</xref>). The drug sensitivity of these targeted therapeutic genes was explored in 49 cell lines based on the drug treatment data provided by the GDSC database. The results demonstrated that breast cancer patients with EGFR mutation (Student&#x2019;s t-test: erlotinib, p = 0.0018; sapitinib, p = 0.0042; lapatinib, p = 0.015) and ERBB2 mutation (Student&#x2019;s t-test: lapatinib, p &lt; 2.22e-16; afatinib, p = 2.3e-2; sapitinib, p = 1.1e-3) had better sensitivity to targeted drugs (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5F</bold>
</xref>). Therefore, we anticipated that combination therapy with multiple targeted agents may be a better approach to treating patients with this subtype.</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Mix_Sub subtype shows significant cell state upregulation in Cell cycle, DNA damage and DNA repair</title>
<p>The functional states of cancer cells are strongly linked to the development and progression of cancer (<xref ref-type="bibr" rid="B24">24</xref>). By calculating the GSVA enrichment scores of 14 cancer-related cell states for each patient, we observed significant variations in cell states among patients with different subtypes (<xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6A, C</bold>
</xref>). In particular, patients with the Mix_Sub subtype showed significant upregulation in cell cycle, DNA damage, and DNA repair compared to the patients with the other subtypes (<xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6A&#x2013;C</bold>
</xref>). To gain further insight, we identified 13 differentially expressed genes in the Mix_Sub subtype patients compared to non-Mix_Sub subtype patients, based on a logFC &gt;= 0.58 and FDR &lt; 0.05. Further, We performed a GO enrichment analysis for these differentially expressed genes and all genes involved in these three cell states. Subsequently, mapping the biological functions enriched by these two sets of genes, it was found that the biological functions enriched by the differentially expressed genes were clustered in those enriched by all genes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S2</bold>
</xref>). Specifically, the differentially expressed genes for these three cell states and the nine most significant biological functions in which they are involved are shown here (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6D</bold>
</xref>). We suspected that the upregulation in these characteristic genes led to alterations in relevant biological functions, further leading to disruption of the normal regulation of cell states and ultimately, resulting in a poor survival outcome for patients with the Mix_Sub subtype.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>
<bold>(A)</bold> The mean values of GSVA enrichment scores of 14 cell states in 4 breast cancer subtypes. <bold>(B)</bold> GSVA scores in the three specific cell states in 4 breast cancer molecular subtypes (Wilcoxon-test, '**'p &lt; 0.01, '***'p &lt; 0.001, '****'p &lt; 0.0001). <bold>(C)</bold> GSVA scores of cell states for each patient in Mix_Sub and non-Mix_Sub subtypes. <bold>(D)</bold> The main biological functions involved the differentially expressed genes of the three specific cell states. Top left: Cell cycle-specific pathways. Middle and lower: DNA damage specific pathways. Upper right: DNA repair specific pathways. <bold>(E)</bold> DNA damage footprint analysis.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1130092-g006.tif"/>
</fig>
<p>Numerous studies have confirmed that homologous recombination deficiency (HRD) is a common feature of many tumors that accelerates carcinogenesis through increasing genomic instability, which has been widely documented in cancers such as breast cancer and has become a valuable biomarker (<xref ref-type="bibr" rid="B25">25</xref>, <xref ref-type="bibr" rid="B26">26</xref>). We found that HRD scores in patients with the Mix_Sub subtype were only lower than in patients with the triple-negative breast cancer-enriched Dom_Basal subtype, suggesting that HRD is also one of the factors contributing to the poor survival outcome in patients with the Mix_Sub subtype (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6E</bold>
</xref>).</p>
</sec>
<sec id="s2_6">
<label>2.6</label>
<title>Mix_Sub subtype exhibits distinct cell-cell communications</title>
<p>Cell&#x2013;cell communication mediated by ligands&#x2013;receptors is essential for the proper functioning of multicellular organisms (<xref ref-type="bibr" rid="B27">27</xref>). We investigated the expression of 1216 ligands and receptors, as well as 32 subtype-specific ligands and receptors, in patients with the Mix_Sub subtype of breast cancer. It revealed a higher proportion of GDTEC expression in Mix_Sub subtype patients compared to non-Mix_Sub subtype patients (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7A</bold>
</xref>, t-test, p &lt; 2.22e-16; <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7B</bold>
</xref>, t-test, p &lt; 2.22e-16). Among these ligands and receptors, the differential ligand NCAM1 and receptors WNT5A and GNAI2 with a high percentage of GDTEC expression in Mix_Sub subtype patients (percentage of patients &gt;= 0.7) and a low percentage of GDTEC expression in non-Mix_Sub subtype patients (percentage of patients &lt;= 0.3) were screened and their GDTEC expression is shown in <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7E</bold>
</xref>. Numerous studies have confirmed the association of the three ligands and receptors with the development and progression of breast cancer (<xref ref-type="bibr" rid="B28">28</xref>, <xref ref-type="bibr" rid="B29">29</xref>) (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7C</bold>
</xref>). Specifically, these three ligands and receptors had a higher proportion of patients with GDTEC expression and lower mRNA expression in the Mix_Sub subtype, while the opposite trend was observed in the non-Mix_Sub subtype, reflecting transcriptome expression was driven by genomic variation (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7D</bold>
</xref>). Next, correlation analysis based on the expression of these three specific ligands and receptors revealed that only NCAM1 had a high correlation with its corresponding receptor (Spearman correlation coefficient &gt;= 0.2, P&lt;0.05) (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7G</bold>
</xref>). Additionally, NCAM1 was mapped into the human protein interaction network, and protein-protein interactions interconnected with NCAM1 were screened according to the same criteria (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7G</bold>
</xref>). To our surprise, NCAM1- FGFR1 interaction was identified in both networks, and many studies had proved that this interaction was associated with many cancers (<xref ref-type="bibr" rid="B30">30</xref>). Furthermore, abundant research has demonstrated that the identified FGF family and its related ligands, receptors and locked proteins, are all closely associated with the development of breast cancer (<xref ref-type="bibr" rid="B31">31</xref>).</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>
<bold>(A, B)</bold> Number of genes expressing GDTEC in 1216 and 32 subtype-specific ligands and receptors in patients with different subtypes. <bold>(C)</bold> The ligand-receptor pairs of NCAM1, WNT5A and GNAI2 with high proportion of GDTEC expression in Mix_Sub subtype patients. <bold>(D)</bold> GDTEC expression and mRNA expression of NCAM1, WNT5A and GNAI2 in patients with Mix_Sub subtype and non-Mix_Sub subtype. <bold>(E)</bold> Ratio of patients with GDTEC expression of NCAM1, WNT5A and GNAI2 in Mix_Sub subtype and non-Mix_Sub subtype patients. <bold>(F)</bold> Copy number deletion of NCAM1 in patients. <bold>(G)</bold> NCAM1 ligand-receptor pairs and protein-protein interactions related to breast cancer. <bold>(H)</bold> Diagram of the cell-cell communication mechanism mediated by NCAM1-FGFR1 (Symbol 1: Cis-homophilic interactions of an NCAM1 molecule. Symbol 2: Trans-homophilic interactions between NCAM molecules on different cell membranes. Symbol 3: Interactions between NCAM1 and FGFR1).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1130092-g007.tif"/>
</fig>
<p>Meanwhile, we found that a significant copy number deletion and reduced mRNA expression of NCAM1 in most patients with the Mix_Sub subtype and the reduction in NCAM1 expression appears to be the result of the cis-regulatory effect of genomic copy number changes on transcriptome expression (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7F</bold>
</xref>). We also identified a mechanism of interaction between NCAM1 and FGFR1, as depicted in <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7H</bold>
</xref> (<xref ref-type="bibr" rid="B30">30</xref>, <xref ref-type="bibr" rid="B32">32</xref>&#x2013;<xref ref-type="bibr" rid="B37">37</xref>). Overall, our analysis suggests that the low expression of NCAM1 in Mix_Sub subtype patients is likely caused by the large number of copy number deletions, which restrict its binding to FGFR1, resulting in the inability of various downstream signaling pathways to be activated, which in turn led to tumor deterioration and ultimately to poorer survival outcomes for Mix_Sub subtype patients.</p>
</sec>
<sec id="s2_7">
<label>2.7</label>
<title>Risk model constructed by subtype-specific genes can accurately predict prognosis of patients</title>
<p>To investigate the potential impact of subtype-specific genes on patient survival prognosis. Based on the GDTEC matrix, two prognostic genes, F11R (HR = 2.037, Log-rank, p = 0.0032) and NDRG4 (HR = 1.700, Log-rank, p = 0.0286) were identified from 299 subtype-specific genes using univariate and multivariate Cox proportional hazards models. A prognostic risk model was developed based on these genes, which calculated a risk score for each patient and divided them into high-risk and low-risk groups based on the median risk scor (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8A</bold>
</xref>). The results indicated that patients in the high-risk group had a significantly lower survival rate than the low-risk group (Log-rank, p = 0.01, <xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8B</bold>
</xref>), and there were more deaths in the high-risk group (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8D</bold>
</xref>). Meanwhile, patients were divided into three groups according to whether these two risk genes expressed GDTEC or not, and a significant difference in survival prognosis was found among the three groups (Log-rank, p = 0.001), and the more GDTEC expression of these two risk genes in patients, the worse the survival rate (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8C</bold>
</xref>). Moreover, GO annotation and enrichment analysis of these two risk genes showed that F11R was mainly involved in T cell extravasation and establishment of the endothelial intestinal barrier, NDRG4 was mainly involved in the regulation of endocytic recycling and negative regulation of platelet-derived growth factor receptor signaling pathway, and the two genes were jointly involved in response to radiation. These functional pathways were closely related to the occurrence and development of breast cancer, and can potentially be used as biomarkers for the disease (<xref ref-type="bibr" rid="B38">38</xref>, <xref ref-type="bibr" rid="B39">39</xref>). Collectively, the prognostic risk model constructed using subtype-specific genes has good predictive efficacy for patient survival prognosis.</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>
<bold>(A)</bold> Multivariate cox regression model constructed with the GDTEC expression of NDRG4 and F11R as features. The hazard ratios are shown with 95% confidence intervals (Wald test, '*'p &lt; 0.05, '**'p &lt; 0.01). <bold>(B)</bold> Kaplan-Meier survival chart of low-risk and high-risk breast cancer patients. <bold>(C)</bold> Kaplan-Meier survival chart of the three groups of breast cancer patients were grouped according to whether the two risk genes, F11R and NDRG4, express GDTEC. F_N = 0 indicates that both genes do not express GDTEC; F_N = 1 indicates that one of the genes expresses GDTEC; F_N = 2 indicates that both genes express GDTEC. <bold>(D)</bold> Risk score ranking of patients and their survival status, as well as the risk scores of patients corresponding to the number of genes expressing GDTEC in their 2 risk genes. <bold>(E)</bold> Functions of F11R and NDRG4 two risk genes involved. Pink triangles represent genes and pink circles represent GO functional pathways.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1130092-g008.tif"/>
</fig>
</sec>
<sec id="s2_8">
<label>2.8</label>
<title>Novel mix_Sub subtype and prognostic classifiers were constructed at the mRNA level based on multi-omics-identified biomarkers</title>
<p>Due to poor survival and the uniqueness of patients with the Mix_Sub subtype, accurate diagnosis of patients with the Mix_Sub subtype before clinical treatment is beneficial to the cure of patients. A classifier for the Mix_Sub subtype was constructed by random forest method using GDTEC expression of 31 subtype-specific genes as features. The classifier was able to accurately identify the subtypes of patients in both the training and test datasets, with an accuracy of 0.73 and an AUC of 0.806 (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figures S3</bold>
</xref>, <xref ref-type="fig" rid="f9">
<bold>9A</bold>
</xref>). The generalization ability of the classifier was further validated using an independent dataset of 1981 breast cancer patients with CNV downloaded from the cBioPortal database, achieving an accuracy of 0.89 and an AUC of 0.972 (<xref ref-type="fig" rid="f9">
<bold>Figures&#xa0;9B, C</bold>
</xref>, a significant survival difference: Log-rank, p = 0.00073). Additionally, GO enrichment analysis showed that the 31 marker genes were predominantly related to the regulation of macro autophagy, gland development, regulation of membrane permeability, and platelet-derived growth factor receptor signaling pathway, etc. (<xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9D</bold>
</xref>, Hypergeometric test, p &lt; 0.05). Overall, all these pathways are strongly associated with the development of breast cancer and have been confirmed by numerous studies (<xref ref-type="bibr" rid="B40">40</xref>, <xref ref-type="bibr" rid="B41">41</xref>), reflecting the accuracy of the identified biomarkers.</p>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>
<bold>(A)</bold> ROC curves of classifiers constructed based on 31 marker genes. <bold>(B, C)</bold> ROC curves and Kaplan-Meier survival plots for validation of the Mix_Sub subtype classifier using external breast cancer data. <bold>(D)</bold> GO enrichment analysis of 31 marker genes. <bold>(E)</bold> Gini coefficient for 31 characteristics. <bold>(F)</bold> ROC curves of classifiers constructed based on expression fold changes of 18 marker genes. <bold>(G)</bold> Kaplan-Meier survival curve of K-nearest neighbor (KNN) classification results for the GSE42568 dataset. <bold>(H, I)</bold> Using the grouped GSE42568 dataset, the ROC curves for validating the broad applicability of the Mix_Sub subtype classifier and Kaplan-Meier survival curve for classification results.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1130092-g009.tif"/>
</fig>
<p>As gene expression data is abundant and readily available, we selected eighteen genes with the top importance as candidates based on the Gini coefficients (MeanDecreaseGini &gt; 5.95) from 31 biomarker genes identified by GDTEC features (<xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9E</bold>
</xref>), and their gene expression profiles were used to construct a subtype classifier and prognostic risk model for the Mix_Sub subtype. The AUC of this subtype classifier was 0.737 (<xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9F</bold>
</xref>), and its generalization ability was validated in another independent dataset, GSE42568, (<xref ref-type="fig" rid="f9">
<bold>Figures&#xa0;9G&#x2013;I</bold>
</xref>, AUC = 0.948; Log-rank, p = 0.0036). Then Cox proportional-hazards model was used to evaluate the effect of abnormal expression of these 18 marker genes on patient survival prognosis. A prognostic risk model, characterized by abnormal expression of F11R and MAF, was constructed using multivariate cox regression analysis (<xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10A</bold>
</xref>, F11R: HR = 1.66, p = 0.0261; MAF: HR = 1.66, p = 0.0281). The risk score was calculated for each patient, dividing them into low-risk and high-risk groups according to the median risk score. The high-risk group showed a significantly worse survival rate compared to the low-risk group (<xref ref-type="fig" rid="f10">
<bold>Figures&#xa0;10B, C</bold>
</xref>, Log-rank, p = 0.027). Furthermore, patients were grouped according to the number of abnormally expressed genes in F11R and MAF, and it was found that the higher the number of abnormally expressed genes in patients, the worse the survival rate (<xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10D</bold>
</xref>, Log-rank, p = 0.0071). The accuracy and generalization of the prognostic risk model were validated in the external datasets GSE61304, GSE31448, and GSE42568 (<xref ref-type="fig" rid="f10">
<bold>Figures&#xa0;10E&#x2013;G</bold>
</xref>, GSE61304: Log-rank, p = 0.036, Log-rank, p = 0.043; GSE31448: Log-rank, p = 0.037; GSE42568: Log-rank, p = 0.11). Interestingly, by investigating the alterations in the genome of F11R and MAF, we found that they underwent copy number variation in the vast majority of patients (<xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10H</bold>
</xref>). Notably, F11R was a higher risk factor not only at the gene expression level (<xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10A</bold>
</xref>, HR = 1.66, p = 0.0261) but also at the GDTEC expression level (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8A</bold>
</xref>, HR = 2.037, p = 0.0032), reflecting the reliability of the identified risk factors (<xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10I</bold>
</xref>).</p>
<fig id="f10" position="float">
<label>Figure&#xa0;10</label>
<caption>
<p>
<bold>(A)</bold> Multivariate cox regression model constructed with the LFC of F11R and MAF as features. <bold>(B)</bold> The Kaplan-Meier survival curve for classifying the high and low risks of the TCGA-BRCA samples was constructed by F11R and MAF. <bold>(C)</bold> Survival status of patients in the high risk and low risk groups. <bold>(D)</bold> The Kaplan-Meier survival curvet of the three groups of breast cancer patients is grouped according to the LFC of the two risk genes, F11R and MAF. F_M = 0, indicating that both genes were normally expressed. F_M = 1, indicating that one gene was abnormally expressed. F_M = 2, indicating that both genes were abnormally expressed. <bold>(E&#x2013;G)</bold> Kaplan-Meier survival curve of patients in the high-risk and low-risk groups using the GSE61304, GSE31448, and GSE42568 datasets to validate the constructed risk-prognosis models. <bold>(H)</bold> The copy number variation of F11R and MAF in each sample. <bold>(I)</bold> Risk prognostic factors identified at two levels. <bold>(J)</bold> Spatial variability of MAF, F11R and NDRG4 in typical samples, and the landscape of more samples was displayed in S4. <bold>(K)</bold> Normalized spatial gene expression of MAF in three representative samples and annotated cell types. <bold>(L)</bold> Univariate and multivariate analysis of the FM_risk scores with other standard clinical features in the breast cancer.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1130092-g010.tif"/>
</fig>
<p>Next, the spatial variability of three risk prognostic markers (NDRG4, F11R, MAF) was evaluated in different cell types using spatial transcriptomic data from the SOAR database. The results indicated a significant pattern of spatial expression changes mainly in malignant cells, suggesting that these markers may play a crucial role in the development of malignant cells (<xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10J</bold>
</xref>, <xref ref-type="supplementary-material" rid="SM1">
<bold>S4</bold>
</xref>). Moreover, the spatial expression and variability of MAF in three patients were analyzed, revealing significant spatial variation in malignant cells (<xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10K</bold>
</xref>). Finally, we assessed whether the risk scores (FM_risk) obtained by patients based on this prognostic model were independent of other clinical or pathological factors and found that the FM_risk maintained a significantly independent correlation with survival even after adjusting other standard clinical features in the breast cancer analysis (<xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10L</bold>
</xref>, Univariate cox: HR = 1.66, p = 0.0288; Multivariate cox: HR = 2.085, p = 0.0051).</p>
<p>In conclusion, these results illustrated the accuracy and generalization ability of the biomarkers identified by genes&#x2019; GDTEC features.</p>
</sec>
</sec>
<sec id="s3" sec-type="materials|methods">
<label>3</label>
<title>Materials and methods</title>
<sec id="s3_1">
<label>3.1</label>
<title>TCGA datasets and pre-processing</title>
<p>Clinical data, somatic mutation data, and gene expression data (mRNA count-UQ and mRNA FPKM-UQ) for TCGA-BRCA samples were obtained from the TCGA database (<ext-link ext-link-type="uri" xlink:href="https://portal.gdc.cancer.gov/">https://portal.gdc.cancer.gov/</ext-link>), including 778 disease samples and 100 normal samples. A new mutation dataset (post-SNV dataset) and a gene expression change profile for each patient (post-RNAseq dataset) were obtained after preprocessing. Copy number variation (CNV) data for TCGA-BRCA samples were obtained from the UCSC Xena (<ext-link ext-link-type="uri" xlink:href="https://xenabrowser.net/">https://xenabrowser.net/</ext-link>) database. A new copy number variation matrix (post-CNV dataset) was obtained after preprocessing. Details of the data pre-processing can be found in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material 1</bold>
</xref>.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Construction of multi-omics fusion matrix (GDTEC matrix)</title>
<p>The three pre-processed datasets (post-SNV, CNV, and RNAseq) were combined to form a fusion matrix (GDTEC matrix) of genomic variation-driven transcriptome expression in breast cancer. The gene values from the post-CNV and post-RNAseq datasets were summed, with values of 1 and -1 marked as 0 (expressions not driven by CNV) and values of 2 and -2 marked as 1 (expressions driven by CNV), resulting in the CNV-RNAseq consistency matrix. The value -1 in the post-RNAseq dataset was also marked as 1 to obtain the post2-RNAseq dataset. The gene values from the post-SNV and post2-RNAseq datasets were then summed, with values of 1 marked as 0 (expressions not driven by mutation) and values of 2 marked as 1 (expressions driven by mutation), resulting in the SNV-RNAseq consistency matrix. The CNV-RNAseq and SNV-RNAseq datasets were summed, and values of 2 were marked as 0, as both somatic mutations and copy number variations affecting transcriptome expression are rare. Finally, the genes in the GDTEC matrix with expression levels of 0 in more than 60% of the samples were removed, leaving 299 genes for the identification of breast cancer subtypes.</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>External validation data</title>
<p>We downloaded GSE42568, GSE61304, and GSE31448 data of GPL570 platform from Gene Expression Omnibus (GEO) database as external validation datasets (<ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/geo/">https://www.ncbi.nlm.nih.gov/geo/</ext-link>). These datasets all contain normal samples.</p>
<p>Copy number variation data and clinical survival data of 1981 breast cancer patients were downloaded from cBioPortal database (<ext-link ext-link-type="uri" xlink:href="https://www.cbioportal.org/">https://www.cbioportal.org/</ext-link>) as external validation datasets to verify the generalization ability of the classifier. Patients were grouped according to the occurrence of CNV in the marker genes used to construct the classifier. A patient was defined as a patient of Mix_Sub subtype if more than 80% (&gt;80%) of these marker genes had CNV, otherwise as a patient with non-Mix_Sub subtype.</p>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Data related to tumor microenvironment analysis</title>
<p>Immune signature score data was downloaded from the literature (<xref ref-type="bibr" rid="B42">42</xref>) for 11,080 patients in the TCGA. 160 genes associated with T-cell inflammation were obtained from the literature (<xref ref-type="bibr" rid="B43">43</xref>). The DNA methylation based stemness scores (DNAss) data and the RNA expression based stemness scores (RNAss) data derived by the Stemness group were downloaded from the UCSC Xena (<ext-link ext-link-type="uri" xlink:href="https://xenabrowser.net/">https://xenabrowser.net/</ext-link>).</p>
<p>HRD score data for genome-wide DNA damage footprints were downloaded from this database. HRD score assessed genomic instability caused by homologous recombination deficiency (HRD), including genomic loss of heterozygosity (LOH), telomere allele imbalance (TAI), and large segment migration (LST).</p>
<p>12 consensus group data for TCGA-BRCA classified according to their combined genomic and histological characteristics were obtained from the literature (<xref ref-type="bibr" rid="B20">20</xref>). Also, images that were assessed <italic>via</italic> TCGA digital slide archive (CDSA) (<ext-link ext-link-type="uri" xlink:href="http://cancer.digitalslidearchive.net/">http://cancer.digitalslidearchive.net/</ext-link>) were used for the histological interpretation of TCGA patients.</p>
<p>Drug response data and genomic markers of sensitivity related to breast cancer were downloaded from the Genomics of Drug Sensitivity in Cancer (GDSC) (<ext-link ext-link-type="uri" xlink:href="https://www.cancerrxgene.org/">https://www.cancerrxgene.org/</ext-link>) database.</p>
<p>The data of ligand-receptor interaction pairs was downloaded from the CellTalkDB (<ext-link ext-link-type="uri" xlink:href="http://tcm.zju.edu.cn/celltalkdb/">http://tcm.zju.edu.cn/celltalkdb/</ext-link>) database.</p>
<p>Spatial transcriptome data was obtained from the SOAR database (<ext-link ext-link-type="uri" xlink:href="https://soar.fsm.northwestern.edu/">https://soar.fsm.northwestern.edu/</ext-link>) and the spatial variability of genes in different cell types was analyzed in the SOAR database.</p>
</sec>
<sec id="s3_5">
<label>3.5</label>
<title>Consensus cluster on TCGA-BRCA samples</title>
<p>The R package &#x2018;ConsensusClusterPlus&#x2019; (version 1.54.0) was used to perform consistent clustering on the GDTEC matrix, with four breast cancer subtypes with significantly different survival prognoses identified. <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material 1</bold>
</xref> provides details.</p>
</sec>
<sec id="s3_6">
<label>3.6</label>
<title>Kaplan-Meier and Log-rank test</title>
<p>We used the R packages &#x2018;survival&#x2019; (version 3.2-7) and &#x2018;survminer&#x2019; (version 0.4.9) to calculate the survival difference among subtypes, log rank p &lt; 0.05 represents a significant difference.</p>
</sec>
<sec id="s3_7">
<label>3.7</label>
<title>Gene ontology (GO) functional enrichment analysis</title>
<p>The &#x2018;clusterProfiler&#x2019; package and the &#x2018;org.hs.eg.db&#x2019; package in R were downloaded and their enrichGO function was used to perform functional enrichment analysis on the feature genes. Then, the enrichment results were visualized using functions (emapplot, emapplot, etc.) from the R package &#x2018;enrichplot&#x2019;.</p>
</sec>
<sec id="s3_8">
<label>3.8</label>
<title>MCP to calculate the cell infiltration fraction</title>
<p>The infiltration fraction of immune cell was calculated using the R package MCPcounter (version 1.2.0) (<ext-link ext-link-type="uri" xlink:href="https://github.com/ebecht/MCPcounter">https://github.com/ebecht/MCPcounter</ext-link>) based on the gene expression data in TCGA-BRCA.</p>
</sec>
<sec id="s3_9">
<label>3.9</label>
<title>GSVA to calculate the enrichment score of 14 cell states and 4 types of T cell disorders</title>
<p>Gene Set Variation Analysis (GSVA) is a non-parametric, unsupervised method that estimates the enrichment score of each gene set based on gene expression level. We used R package &#x2018;GSVA&#x2019; (version 1.38.2) to calculate the enrichment scores of 14 cancer-related functional states and 4 types of T cell disorders for each sample based on the gene expression data. Cell status data was downloaded from the CancerSEA (<ext-link ext-link-type="uri" xlink:href="http://biocc.hrbmu.edu.cn/CancerSEA/home.jsp">http://biocc.hrbmu.edu.cn/CancerSEA/home.jsp</ext-link>) database for a total of 1574 genes related to various functional states. 433 genes regarded to be associated with T-cell disorders were obtained from the literature (<xref ref-type="bibr" rid="B44">44</xref>, <xref ref-type="bibr" rid="B45">45</xref>).</p>
</sec>
<sec id="s3_10">
<label>3.10</label>
<title>Cox proportional hazards regression model and the Mix_Sub subtype classifier</title>
<p>We constructed prognostic risk models and subtype classifiers for the Mix_Sub subtype using a Cox proportional hazards regression model and a random forest approach. More information can be found in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material 1</bold>
</xref>.</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>Breast cancer is a highly heterogeneous disease, and the identification of subtypes is important for the accurate diagnosis and personalized treatment of patients. Meanwhile, the development of fusion analysis of multi-omics data has advanced the understanding of cancer subtypes. However, most previous studies were performed based on correlations between multi-omics data and only considered associations between single aspects of omics, such as correlation analysis between somatic mutations and transcriptome expression, and correlation analysis between copy number variation and transcriptome expression. And cancer typing based on the driving relationships between omics remains to be explored.</p>
<p>In this study, we proposed a novel multi-omics fusion approach for breast cancer typing, which focuses on the driving relationship between the genome and transcriptome, where the genomic level includes somatic mutations and copy number variation. We expressed the driving relationships as dichotomous variables and fused them into a matrix. We identified four subtypes based on this relationship matrix and found that the Mix_Sub subtype was associated with the worst survival rate, but it contained a smaller number of triple-negative breast cancers that are currently considered difficult to treat. Subsequently, the Mix_Sub subtype was found to be significantly different from other subtypes in terms of phenotype, tumor microenvironment, intercellular communication, and cell states, and revealed that its worst survival may be the result of the combined effects of a large number of his altered biological functions and cellular status, higher T-cell disorders and HRD, lower immune cell infiltration, inflammatory response, and tumor malignancy and blocked cell-cell communication. It was also found that it may be more suitable for targeted drug therapy. Finally, based on the differences in driving relationships among patients with different subtypes, we identified 31 differential genes as biomarkers and used them to construct a risk prognostic model and a subtype classifier for the Mix_Sub subtype. Considering the abundance and availability of gene expression data, we also constructed a risk prognostic model and a subtype classifier for the Mix_Sub subtype using a subset of these biomarkers at the gene expression level only. And the generalization ability of these 2 levels of subtype classifiers and prognostic models was validated in 4 GEO datasets. Additionally, the identified prognostic risk genes showed significant spatial variability in malignant cells, highlighting their reliability and potential prognostic significance.</p>
<p>Moreover, when setting the threshold of LFC for determining whether a gene is abnormally expressed, we have chosen a more reasonable threshold of LFC by considering the factors of the robustness of GDTEC matrixes generated under different thresholds of LFC, and the consistency of the consistent clustering results.</p>
<p>Overall, our results demonstrate the potential of our multi-omics fusion approach in enhancing our understanding of breast cancer heterogeneity. By fusing information from both the genome and transcriptome, our approach provides a new perspective for interpreting multi-omics data in complex diseases. Further studies are needed to validate our findings and to explore the application of our approach in other cancer types.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusions</title>
<p>Our study sheds new light on the heterogeneity of breast cancer by identifying a novel hybrid subtype, Mix_Sub, with a poor prognosis and unique phenotypic and clinical features. Further investigation into the inter-omics driving relationship uncovered the complexity and distinctiveness of Mix_Sub, including its tumor microenvironment, cell states, and cell-cell communication. By identifying biomarkers with significant spatial variability in malignant tumor cells, we have developed effective Mix_Sub subtype classifiers and prognostic risk models. In conclusion, this work advances our understanding of breast cancer and highlights the importance of inter-omics analysis in uncovering the underlying mechanisms of complex diseases.</p>
</sec>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. Further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>Conceptualization: H-jW, X-lG, JB, and Z-zW; methodology: Z-zW and X-hL; validation: X-hL and NW; formal analysis: X-hL; resources: NW, X-lW, YG, XZ, S-hF, and F-fX; writing-original draft preparation: X-hL; writing-review and editing: X-lW, H-jW and Z-zW; visualization: X-hL; and supervision: H-jW, X-lG, JB, and Z-zW. All authors contributed to the article and approved the submitted version.</p>
</sec>
</body>
<back>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>This work was supported by the Natural Science Foundation of Hainan Province (No.821MS0777, 822MS074, 821MS045, 621MS041); National Natural Science Foundation of China (No.31701159,32160179); Major Science and Technology Program of Hainan Province (No.ZDKJ202003); Innovative Research Projects for Graduate Students of Hainan Medical University (HYYS2021B11); the Education Department of Hainan Province (No.Hnky2022-32); Hainan Province Clinical Medical Center.</p>
</sec>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fonc.2023.1130092/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fonc.2023.1130092/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reis-Filho</surname> <given-names>JS</given-names>
</name>
<name>
<surname>Pusztai</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Gene expression profiling in breast cancer: classification, prognostication, and prediction</article-title>. <source>Lancet</source> (<year>2011</year>) <volume>378</volume>(<issue>9805</issue>):<page-range>1812&#x2013;23</page-range>. doi: <pub-id pub-id-type="doi">10.1016/S0140-6736(11)61539-0</pub-id>
</citation>
</ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Waks</surname> <given-names>AG</given-names>
</name>
<name>
<surname>Winer</surname> <given-names>EP</given-names>
</name>
</person-group>. <article-title>Breast cancer treatment: A review</article-title>. <source>JAMA</source> (<year>2019</year>) <volume>321</volume>(<issue>3</issue>):<page-range>288&#x2013;300</page-range>. doi: <pub-id pub-id-type="doi">10.1001/jama.2018.19323</pub-id>
</citation>
</ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tao</surname> <given-names>M</given-names>
</name>
<name>
<surname>Song</surname> <given-names>T</given-names>
</name>
<name>
<surname>Du</surname> <given-names>W</given-names>
</name>
<name>
<surname>Han</surname> <given-names>S</given-names>
</name>
<name>
<surname>Zuo</surname> <given-names>C</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Classifying breast cancer subtypes using multiple kernel learning based on omics data</article-title>. <source>Genes (Basel)</source> (<year>2019</year>) <volume>10</volume>(<issue>3</issue>):<fpage>200</fpage>. doi: <pub-id pub-id-type="doi">10.3390/genes10030200</pub-id>
</citation>
</ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Parker</surname> <given-names>JS</given-names>
</name>
<name>
<surname>Mullins</surname> <given-names>M</given-names>
</name>
<name>
<surname>Cheang</surname> <given-names>MC</given-names>
</name>
<name>
<surname>Leung</surname> <given-names>S</given-names>
</name>
<name>
<surname>Voduc</surname> <given-names>D</given-names>
</name>
<name>
<surname>Vickery</surname> <given-names>T</given-names>
</name>
<etal/>
</person-group>. <article-title>Supervised risk predictor of breast cancer based on intrinsic subtypes</article-title>. <source>J Clin Oncol</source> (<year>2009</year>) <volume>27</volume>(<issue>8</issue>):<page-range>1160&#x2013;7</page-range>. doi: <pub-id pub-id-type="doi">10.1200/JCO.2008.18.1370</pub-id>
</citation>
</ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vural</surname> <given-names>S</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Guda</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>Classification of breast cancer patients using somatic mutation profiles and machine learning approaches</article-title>. <source>BMC Syst Biol</source> (<year>2016</year>) <volume>10</volume>(<supplement>Suppl 3</supplement>):<fpage>62</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12918-016-0306-z</pub-id>
</citation>
</ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Andre</surname> <given-names>F</given-names>
</name>
<name>
<surname>Job</surname> <given-names>B</given-names>
</name>
<name>
<surname>Dessen</surname> <given-names>P</given-names>
</name>
<name>
<surname>Tordai</surname> <given-names>A</given-names>
</name>
<name>
<surname>Michiels</surname> <given-names>S</given-names>
</name>
<name>
<surname>Liedtke</surname> <given-names>C</given-names>
</name>
<etal/>
</person-group>. <article-title>Molecular characterization of breast cancer with high-resolution oligonucleotide comparative genomic hybridization array</article-title>. <source>Clin Cancer Res</source> (<year>2009</year>) <volume>15</volume>(<issue>2</issue>):<page-range>441&#x2013;51</page-range>. doi: <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-08-1791</pub-id>
</citation>
</ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bhattacharyya</surname> <given-names>M</given-names>
</name>
<name>
<surname>Nath</surname> <given-names>J</given-names>
</name>
<name>
<surname>Bandyopadhyay</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>MicroRNA signatures highlight new breast cancer subtypes</article-title>. <source>Gene</source> (<year>2015</year>) <volume>556</volume>(<issue>2</issue>):<page-range>192&#x2013;8</page-range>. doi: <pub-id pub-id-type="doi">10.1016/j.gene.2014.11.053</pub-id>
</citation>
</ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gomez-Cabrero</surname> <given-names>D</given-names>
</name>
<name>
<surname>Abugessaisa</surname> <given-names>I</given-names>
</name>
<name>
<surname>Maier</surname> <given-names>D</given-names>
</name>
<name>
<surname>Teschendorff</surname> <given-names>A</given-names>
</name>
<name>
<surname>Merkenschlager</surname> <given-names>M</given-names>
</name>
<name>
<surname>Gisel</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Data integration in the era of omics: current and future challenges</article-title>. <source>BMC Syst Biol</source> (<year>2014</year>) <volume>8</volume>(<supplement>Suppl 2</supplement>):<fpage>l1</fpage>. doi: <pub-id pub-id-type="doi">10.1186/1752-0509-8-S2-I1</pub-id>
</citation>
</ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>H</given-names>
</name>
<name>
<surname>Li</surname> <given-names>G</given-names>
</name>
<name>
<surname>Du</surname> <given-names>W</given-names>
</name>
</person-group>. <article-title>Classifying breast cancer subtypes using deep neural networks based on multi-omics data</article-title>. <source>Genes (Basel)</source> (<year>2020</year>) <volume>11</volume>(<issue>8</issue>):<fpage>888</fpage>. doi: <pub-id pub-id-type="doi">10.3390/genes11080888</pub-id>
</citation>
</ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Curtis</surname> <given-names>C</given-names>
</name>
<name>
<surname>Shah</surname> <given-names>SP</given-names>
</name>
<name>
<surname>Chin</surname> <given-names>SF</given-names>
</name>
<name>
<surname>Turashvili</surname> <given-names>G</given-names>
</name>
<name>
<surname>Rueda</surname> <given-names>OM</given-names>
</name>
<name>
<surname>Dunning</surname> <given-names>MJ</given-names>
</name>
<etal/>
</person-group>. <article-title>The genomic and transcriptomic architecture of 2,000 breast tumours reveals novel subgroups</article-title>. <source>Nature</source> (<year>2012</year>) <volume>486</volume>(<issue>7403</issue>):<page-range>346&#x2013;52</page-range>. doi: <pub-id pub-id-type="doi">10.1038/nature10983</pub-id>
</citation>
</ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shen</surname> <given-names>R</given-names>
</name>
<name>
<surname>Olshen</surname> <given-names>AB</given-names>
</name>
<name>
<surname>Ladanyi</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Integrative clustering of multiple genomic data types using a joint latent variable model with application to breast and lung cancer subtype analysis</article-title>. <source>Bioinformatics</source> (<year>2009</year>) <volume>25</volume>(<issue>22</issue>):<page-range>2906&#x2013;12</page-range>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btp543</pub-id>
</citation>
</ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Netanely</surname> <given-names>D</given-names>
</name>
<name>
<surname>Avraham</surname> <given-names>A</given-names>
</name>
<name>
<surname>Ben-Baruch</surname> <given-names>A</given-names>
</name>
<name>
<surname>Evron</surname> <given-names>E</given-names>
</name>
<name>
<surname>Shamir</surname> <given-names>R</given-names>
</name>
</person-group>. <article-title>Expression and methylation patterns partition luminal-a breast tumors into distinct prognostic subgroups</article-title>. <source>Breast Cancer Res</source> (<year>2016</year>) <volume>18</volume>(<issue>1</issue>):<fpage>74</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13058-016-0724-2</pub-id>
</citation>
</ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nguyen</surname> <given-names>QH</given-names>
</name>
<name>
<surname>Nguyen</surname> <given-names>H</given-names>
</name>
<name>
<surname>Nguyen</surname> <given-names>T</given-names>
</name>
<name>
<surname>Le</surname> <given-names>DH</given-names>
</name>
</person-group>. <article-title>Multi-omics analysis detects novel prognostic subgroups of breast cancer</article-title>. <source>Front Genet</source> (<year>2020</year>) <volume>11</volume>:<elocation-id>574661</elocation-id>. doi: <pub-id pub-id-type="doi">10.3389/fgene.2020.574661</pub-id>
</citation>
</ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hanahan</surname> <given-names>D</given-names>
</name>
<name>
<surname>Weinberg</surname> <given-names>RA</given-names>
</name>
</person-group>. <article-title>Hallmarks of cancer: the next generation</article-title>. <source>Cell</source> (<year>2011</year>) <volume>144</volume>(<issue>5</issue>):<page-range>646&#x2013;74</page-range>. doi: <pub-id pub-id-type="doi">10.1016/j.cell.2011.02.013</pub-id>
</citation>
</ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Borellini</surname> <given-names>F</given-names>
</name>
<name>
<surname>Oka</surname> <given-names>T</given-names>
</name>
</person-group>. <article-title>Growth control and differentiation in mammary epithelial cells</article-title>. <source>Environ Health Perspect</source> (<year>1989</year>) <volume>80</volume>:<fpage>85</fpage>&#x2013;<lpage>99</lpage>. doi: <pub-id pub-id-type="doi">10.1289/ehp.898085</pub-id>
</citation>
</ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Payne</surname> <given-names>SL</given-names>
</name>
<name>
<surname>Fogelgren</surname> <given-names>B</given-names>
</name>
<name>
<surname>Hess</surname> <given-names>AR</given-names>
</name>
<name>
<surname>Seftor</surname> <given-names>EA</given-names>
</name>
<name>
<surname>Wiley</surname> <given-names>EL</given-names>
</name>
<name>
<surname>Fong</surname> <given-names>SF</given-names>
</name>
<etal/>
</person-group>. <article-title>Lysyl oxidase regulates breast cancer cell migration and adhesion through a hydrogen peroxide-mediated mechanism</article-title>. <source>Cancer Res</source> (<year>2005</year>) <volume>65</volume>(<issue>24</issue>):<page-range>11429&#x2013;36</page-range>. doi: <pub-id pub-id-type="doi">10.1158/0008-5472.CAN-05-1274</pub-id>
</citation>
</ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gee</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Robertson</surname> <given-names>JF</given-names>
</name>
<name>
<surname>Ellis</surname> <given-names>IO</given-names>
</name>
<name>
<surname>Nicholson</surname> <given-names>RI</given-names>
</name>
</person-group>. <article-title>Phosphorylation of ERK1/2 mitogen-activated protein kinase is associated with poor response to anti-hormonal therapy and decreased patient survival in clinical breast cancer</article-title>. <source>Int J Cancer</source> (<year>2001</year>) <volume>95</volume>(<issue>4</issue>):<page-range>247&#x2013;54</page-range>. doi: <pub-id pub-id-type="doi">10.1002/1097-0215(20010720)95:4&lt;247::AID-IJC1042&gt;3.0.CO;2-S</pub-id>
</citation>
</ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baghban</surname> <given-names>R</given-names>
</name>
<name>
<surname>Roshangar</surname> <given-names>L</given-names>
</name>
<name>
<surname>Jahanban-Esfahlan</surname> <given-names>R</given-names>
</name>
<name>
<surname>Seidi</surname> <given-names>K</given-names>
</name>
<name>
<surname>Ebrahimi-Kalan</surname> <given-names>A</given-names>
</name>
<name>
<surname>Jaymand</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Tumor microenvironment complexity and therapeutic implications at a glance</article-title>. <source>Cell Commun Signal</source> (<year>2020</year>) <volume>18</volume>(<issue>1</issue>):<fpage>59</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12964-020-0530-4</pub-id>
</citation>
</ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nunes</surname> <given-names>SC</given-names>
</name>
</person-group>. <article-title>Tumor microenvironment - selective pressures boosting cancer progression</article-title>. <source>Adv Exp Med Biol</source> (<year>2020</year>) <volume>1219</volume>:<fpage>35</fpage>&#x2013;<lpage>49</lpage>. doi: <pub-id pub-id-type="doi">10.1007/978-3-030-34025-4_2</pub-id>
</citation>
</ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thennavan</surname> <given-names>A</given-names>
</name>
<name>
<surname>Beca</surname> <given-names>F</given-names>
</name>
<name>
<surname>Xia</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Recio</surname> <given-names>SG</given-names>
</name>
<name>
<surname>Allison</surname> <given-names>K</given-names>
</name>
<name>
<surname>Collins</surname> <given-names>LC</given-names>
</name>
<etal/>
</person-group>. <article-title>Molecular analysis of TCGA breast cancer histologic types</article-title>. <source>Cell Genom</source> (<year>2021</year>) <volume>1</volume>(<issue>3</issue>):<fpage>100067</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.xgen.2021.100067</pub-id>
</citation>
</ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roberto</surname> <given-names>M</given-names>
</name>
<name>
<surname>Astone</surname> <given-names>A</given-names>
</name>
<name>
<surname>Botticelli</surname> <given-names>A</given-names>
</name>
<name>
<surname>Carbognin</surname> <given-names>L</given-names>
</name>
<name>
<surname>Cassano</surname> <given-names>A</given-names>
</name>
<name>
<surname>D'Auria</surname> <given-names>G</given-names>
</name>
<etal/>
</person-group>. <article-title>CDK4/6 inhibitor treatments in patients with hormone receptor positive, Her2 negative advanced breast cancer: Potential molecular mechanisms, clinical implications and future perspectives</article-title>. <source>Cancers (Basel)</source> (<year>2021</year>) <volume>13</volume>(<issue>2</issue>):<fpage>332</fpage>. doi: <pub-id pub-id-type="doi">10.3390/cancers13020332</pub-id>
</citation>
</ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brase</surname> <given-names>JC</given-names>
</name>
<name>
<surname>Schmidt</surname> <given-names>M</given-names>
</name>
<name>
<surname>Fischbach</surname> <given-names>T</given-names>
</name>
<name>
<surname>Sultmann</surname> <given-names>H</given-names>
</name>
<name>
<surname>Bojar</surname> <given-names>H</given-names>
</name>
<name>
<surname>Koelbl</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>ERBB2 and TOP2A in breast cancer: A comprehensive analysis of gene amplification, RNA levels, and protein expression and their influence on prognosis and prediction</article-title>. <source>Clin Cancer Res</source> (<year>2010</year>) <volume>16</volume>(<issue>8</issue>):<page-range>2391&#x2013;401</page-range>. doi: <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-09-2471</pub-id>
</citation>
</ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nevedomskaya</surname> <given-names>E</given-names>
</name>
<name>
<surname>Perryman</surname> <given-names>R</given-names>
</name>
<name>
<surname>Solanki</surname> <given-names>S</given-names>
</name>
<name>
<surname>Syed</surname> <given-names>N</given-names>
</name>
<name>
<surname>Mayboroda</surname> <given-names>OA</given-names>
</name>
<name>
<surname>Keun</surname> <given-names>HC</given-names>
</name>
</person-group>. <article-title>A systems oncology approach identifies NT5E as a key metabolic regulator in tumor cells and modulator of platinum sensitivity</article-title>. <source>J Proteome Res</source> (<year>2016</year>) <volume>15</volume>(<issue>1</issue>):<page-range>280&#x2013;90</page-range>. doi: <pub-id pub-id-type="doi">10.1021/acs.jproteome.5b00793</pub-id>
</citation>
</ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yuan</surname> <given-names>H</given-names>
</name>
<name>
<surname>Yan</surname> <given-names>M</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>G</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>W</given-names>
</name>
<name>
<surname>Deng</surname> <given-names>C</given-names>
</name>
<name>
<surname>Liao</surname> <given-names>G</given-names>
</name>
<etal/>
</person-group>. <article-title>CancerSEA: A cancer single-cell state atlas</article-title>. <source>Nucleic Acids Res</source> (<year>2019</year>) <volume>47</volume>(<issue>D1</issue>):<page-range>D900&#x2013;8</page-range>. doi: <pub-id pub-id-type="doi">10.1093/nar/gky939</pub-id>
</citation>
</ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ali</surname> <given-names>RMM</given-names>
</name>
<name>
<surname>Mcintosh</surname> <given-names>SA</given-names>
</name>
<name>
<surname>Savage</surname> <given-names>KI</given-names>
</name>
</person-group>. <article-title>Homologous recombination deficiency in breast cancer: Implications for risk, cancer development, and therapy</article-title>. <source>Genes Chromosomes Cancer</source> (<year>2021</year>) <volume>60</volume>(<issue>5</issue>):<page-range>358&#x2013;72</page-range>. doi: <pub-id pub-id-type="doi">10.1002/gcc.22921</pub-id>
</citation>
</ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sharma</surname> <given-names>P</given-names>
</name>
<name>
<surname>Barlow</surname> <given-names>WE</given-names>
</name>
<name>
<surname>Godwin</surname> <given-names>AK</given-names>
</name>
<name>
<surname>Pathak</surname> <given-names>H</given-names>
</name>
<name>
<surname>Isakova</surname> <given-names>K</given-names>
</name>
<name>
<surname>Williams</surname> <given-names>D</given-names>
</name>
<etal/>
</person-group>. <article-title>Impact of homologous recombination deficiency biomarkers on outcomes in patients with triple-negative breast cancer treated with adjuvant doxorubicin and cyclophosphamide (SWOG S9313)</article-title>. <source>Ann Oncol</source> (<year>2018</year>) <volume>29</volume>(<issue>3</issue>):<page-range>654&#x2013;60</page-range>. doi: <pub-id pub-id-type="doi">10.1093/annonc/mdx821</pub-id>
</citation>
</ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ramilowski</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Goldberg</surname> <given-names>T</given-names>
</name>
<name>
<surname>Harshbarger</surname> <given-names>J</given-names>
</name>
<name>
<surname>Kloppmann</surname> <given-names>E</given-names>
</name>
<name>
<surname>Lizio</surname> <given-names>M</given-names>
</name>
<name>
<surname>Satagopam</surname> <given-names>VP</given-names>
</name>
<etal/>
</person-group>. <article-title>A draft network of ligand-receptor-mediated multicellular signalling in human</article-title>. <source>Nat Commun</source> (<year>2015</year>) <volume>6</volume>:<fpage>7866</fpage>. doi: <pub-id pub-id-type="doi">10.1038/ncomms8866</pub-id>
</citation>
</ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Prasad</surname> <given-names>CP</given-names>
</name>
<name>
<surname>Chaurasiya</surname> <given-names>SK</given-names>
</name>
<name>
<surname>Guilmain</surname> <given-names>W</given-names>
</name>
<name>
<surname>Andersson</surname> <given-names>T</given-names>
</name>
</person-group>. <article-title>WNT5A signaling impairs breast cancer cell migration and invasion <italic>via</italic> mechanisms independent of the epithelial-mesenchymal transition</article-title>. <source>J Exp Clin Cancer Res</source> (<year>2016</year>) <volume>35</volume>(<issue>1</issue>):<fpage>144</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13046-016-0421-0</pub-id>
</citation>
</ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Specht</surname> <given-names>K</given-names>
</name>
<name>
<surname>Harbeck</surname> <given-names>N</given-names>
</name>
<name>
<surname>Smida</surname> <given-names>J</given-names>
</name>
<name>
<surname>Annecke</surname> <given-names>K</given-names>
</name>
<name>
<surname>Reich</surname> <given-names>U</given-names>
</name>
<name>
<surname>Naehrig</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Expression profiling identifies genes that predict recurrence of breast cancer after adjuvant CMF-based chemotherapy</article-title>. <source>Breast Cancer Res Treat</source> (<year>2009</year>) <volume>118</volume>(<issue>1</issue>):<fpage>45</fpage>&#x2013;<lpage>56</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10549-008-0207-y</pub-id>
</citation>
</ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zamai</surname> <given-names>M</given-names>
</name>
<name>
<surname>Trullo</surname> <given-names>A</given-names>
</name>
<name>
<surname>Giordano</surname> <given-names>M</given-names>
</name>
<name>
<surname>Corti</surname> <given-names>V</given-names>
</name>
<name>
<surname>Arza Cuesta</surname> <given-names>E</given-names>
</name>
<name>
<surname>Francavilla</surname> <given-names>C</given-names>
</name>
<etal/>
</person-group>. <article-title>Number and brightness analysis reveals that NCAM and FGF2 elicit different assembly and dynamics of FGFR1 in live cells</article-title>. <source>J Cell Sci</source> (<year>2019</year>) <volume>132</volume>(<issue>1</issue>). doi: <pub-id pub-id-type="doi">10.1242/jcs.220624</pub-id>
</citation>
</ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guan</surname> <given-names>F</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
<name>
<surname>He</surname> <given-names>F</given-names>
</name>
</person-group>. <article-title>Promotion of cell migration by neural cell adhesion molecule (NCAM) is enhanced by PSA in a polysialyltransferase-specific manner</article-title>. <source>PloS One</source> (<year>2015</year>) <volume>10</volume>(<issue>4</issue>):<elocation-id>e0124237</elocation-id>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0124237</pub-id>
</citation>
</ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Soroka</surname> <given-names>V</given-names>
</name>
<name>
<surname>Kolkova</surname> <given-names>K</given-names>
</name>
<name>
<surname>Kastrup</surname> <given-names>JS</given-names>
</name>
<name>
<surname>Diederichs</surname> <given-names>K</given-names>
</name>
<name>
<surname>Breed</surname> <given-names>J</given-names>
</name>
<name>
<surname>Kiselyov</surname> <given-names>VV</given-names>
</name>
<etal/>
</person-group>. <article-title>Structure and interactions of NCAM Ig1-2-3 suggest a novel zipper mechanism for homophilic adhesion</article-title>. <source>Structure</source> (<year>2003</year>) <volume>11</volume>(<issue>10</issue>):<page-range>1291&#x2013;301</page-range>. doi: <pub-id pub-id-type="doi">10.1016/j.str.2003.09.006</pub-id>
</citation>
</ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Christensen</surname> <given-names>C</given-names>
</name>
<name>
<surname>Berezin</surname> <given-names>V</given-names>
</name>
<name>
<surname>Bock</surname> <given-names>E</given-names>
</name>
</person-group>. <article-title>Neural cell adhesion molecule differentially interacts with isoforms of the fibroblast growth factor receptor</article-title>. <source>Neuroreport</source> (<year>2011</year>) <volume>22</volume>(<issue>15</issue>):<page-range>727&#x2013;32</page-range>. doi: <pub-id pub-id-type="doi">10.1097/WNR.0b013e3283491682</pub-id>
</citation>
</ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Saffell</surname> <given-names>JL</given-names>
</name>
<name>
<surname>Walsh</surname> <given-names>FS</given-names>
</name>
<name>
<surname>Doherty</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>Expression of NCAM containing VASE in neurons can account for a developmental loss in their neurite outgrowth response to NCAM in a cellular substratum</article-title>. <source>J Cell Biol</source> (<year>1994</year>) <volume>125</volume>(<issue>2</issue>):<page-range>427&#x2013;36</page-range>. doi: <pub-id pub-id-type="doi">10.1083/jcb.125.2.427</pub-id>
</citation>
</ref>
<ref id="B35">
<label>35</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Francavilla</surname> <given-names>C</given-names>
</name>
<name>
<surname>Cattaneo</surname> <given-names>P</given-names>
</name>
<name>
<surname>Berezin</surname> <given-names>V</given-names>
</name>
<name>
<surname>Bock</surname> <given-names>E</given-names>
</name>
<name>
<surname>Ami</surname> <given-names>D</given-names>
</name>
<name>
<surname>de Marco</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>The binding of NCAM to FGFR1 induces a specific cellular response mediated by receptor trafficking</article-title>. <source>J Cell Biol</source> (<year>2009</year>) <volume>187</volume>(<issue>7</issue>):<page-range>1101&#x2013;16</page-range>. doi: <pub-id pub-id-type="doi">10.1083/jcb.200903030</pub-id>
</citation>
</ref>
<ref id="B36">
<label>36</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Suzuki</surname> <given-names>M</given-names>
</name>
<name>
<surname>Patel</surname> <given-names>K</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>C-C</given-names>
</name>
<name>
<surname>Costa</surname> <given-names>FDA</given-names>
</name>
<name>
<surname>Kondo</surname> <given-names>A</given-names>
</name>
<name>
<surname>Soares</surname> <given-names>FA</given-names>
</name>
<etal/>
</person-group>. <article-title>Loss of expression of the neural cell adhesion molecule 1 (NCAM1) in atypical teratoid/rhabdoid tumors: a new diagnostic marker</article-title>? <source>Appl Cancer Res</source> (<year>2017</year>) <volume>37</volume>(<issue>1</issue>):<fpage>14</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s41241-017-0025-9</pub-id>
</citation>
</ref>
<ref id="B37">
<label>37</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Scarpino</surname> <given-names>S</given-names>
</name>
<name>
<surname>Di Napoli</surname> <given-names>A</given-names>
</name>
<name>
<surname>Melotti</surname> <given-names>F</given-names>
</name>
<name>
<surname>Talerico</surname> <given-names>C</given-names>
</name>
<name>
<surname>Cancrini</surname> <given-names>A</given-names>
</name>
<name>
<surname>Ruco</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Papillary carcinoma of the thyroid: Low expression of NCAM (CD56) is associated with downregulation of VEGF-d production by tumour cells</article-title>. <source>J Pathol</source> (<year>2007</year>) <volume>212</volume>(<issue>4</issue>):<page-range>411&#x2013;9</page-range>. doi: <pub-id pub-id-type="doi">10.1002/path.2183</pub-id>
</citation>
</ref>
<ref id="B38">
<label>38</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bednarek</surname> <given-names>R</given-names>
</name>
<name>
<surname>Selmi</surname> <given-names>A</given-names>
</name>
<name>
<surname>Wojkowska</surname> <given-names>D</given-names>
</name>
<name>
<surname>Karolczak</surname> <given-names>K</given-names>
</name>
<name>
<surname>Popielarski</surname> <given-names>M</given-names>
</name>
<name>
<surname>Stasiak</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Functional inhibition of F11 receptor (F11R/junctional adhesion molecule-A/JAM-A) activity by a F11R-derived peptide in breast cancer and its microenvironment</article-title>. <source>Breast Cancer Res Treat</source> (<year>2020</year>) <volume>179</volume>(<issue>2</issue>):<page-range>325&#x2013;35</page-range>. doi: <pub-id pub-id-type="doi">10.1007/s10549-019-05471-x</pub-id>
</citation>
</ref>
<ref id="B39">
<label>39</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>X</given-names>
</name>
<name>
<surname>An</surname> <given-names>L</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X</given-names>
</name>
</person-group>. <article-title>NDRG3 and NDRG4, two novel tumor-related genes</article-title>. <source>BioMed Pharmacother</source> (<year>2013</year>) <volume>67</volume>(<issue>7</issue>):<page-range>681&#x2013;4</page-range>. doi: <pub-id pub-id-type="doi">10.1016/j.biopha.2013.04.009</pub-id>
</citation>
</ref>
<ref id="B40">
<label>40</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Santana-Codina</surname> <given-names>N</given-names>
</name>
<name>
<surname>Mancias</surname> <given-names>JD</given-names>
</name>
<name>
<surname>Kimmelman</surname> <given-names>AC</given-names>
</name>
</person-group>. <article-title>The role of autophagy in cancer</article-title>. <source>Annu Rev Cancer Biol</source> (<year>2017</year>) <volume>1</volume>:<fpage>19</fpage>&#x2013;<lpage>39</lpage>. doi: <pub-id pub-id-type="doi">10.1146/annurev-cancerbio-041816-122338</pub-id>
</citation>
</ref>
<ref id="B41">
<label>41</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lanigan</surname> <given-names>F</given-names>
</name>
<name>
<surname>O'connor</surname> <given-names>D</given-names>
</name>
<name>
<surname>Martin</surname> <given-names>F</given-names>
</name>
<name>
<surname>Gallagher</surname> <given-names>WM</given-names>
</name>
</person-group>. <article-title>Molecular links between mammary gland development and breast cancer</article-title>. <source>Cell Mol Life Sci</source> (<year>2007</year>) <volume>64</volume>(<issue>24</issue>):<page-range>3159&#x2013;84</page-range>. doi: <pub-id pub-id-type="doi">10.1007/s00018-007-7386-2</pub-id>
</citation>
</ref>
<ref id="B42">
<label>42</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thorsson</surname> <given-names>V</given-names>
</name>
<name>
<surname>Gibbs</surname> <given-names>DL</given-names>
</name>
<name>
<surname>Brown</surname> <given-names>SD</given-names>
</name>
<name>
<surname>Wolf</surname> <given-names>D</given-names>
</name>
<name>
<surname>Bortone</surname> <given-names>DS</given-names>
</name>
<name>
<surname>Ou Yang</surname> <given-names>TH</given-names>
</name>
<etal/>
</person-group>. <article-title>The immune landscape of cancer</article-title>. <source>Immunity</source> (<year>2019</year>) <volume>51</volume>(<issue>2</issue>):<page-range>411&#x2013;2</page-range>. doi: <pub-id pub-id-type="doi">10.1016/j.immuni.2019.08.004</pub-id>
</citation>
</ref>
<ref id="B43">
<label>43</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bao</surname> <given-names>R</given-names>
</name>
<name>
<surname>Stapor</surname> <given-names>D</given-names>
</name>
<name>
<surname>Luke</surname> <given-names>JJ</given-names>
</name>
</person-group>. <article-title>Molecular correlates and therapeutic targets in T cell-inflamed versus non-T cell-inflamed tumors across cancer types</article-title>. <source>Genome Med</source> (<year>2020</year>) <volume>12</volume>(<issue>1</issue>):<fpage>90</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13073-020-00787-6</pub-id>
</citation>
</ref>
<ref id="B44">
<label>44</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname> <given-names>P</given-names>
</name>
<name>
<surname>Gu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Pan</surname> <given-names>D</given-names>
</name>
<name>
<surname>Fu</surname> <given-names>J</given-names>
</name>
<name>
<surname>Sahu</surname> <given-names>A</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>X</given-names>
</name>
<etal/>
</person-group>. <article-title>Signatures of T cell dysfunction and exclusion predict cancer immunotherapy response</article-title>. <source>Nat Med</source> (<year>2018</year>) <volume>24</volume>(<issue>10</issue>):<page-range>1550&#x2013;8</page-range>. doi: <pub-id pub-id-type="doi">10.1038/s41591-018-0136-1</pub-id>
</citation>
</ref>
<ref id="B45">
<label>45</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Shao</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>G</given-names>
</name>
</person-group>. <article-title>Exhaustion and senescence: two crucial dysfunctional states of T cells in the tumor microenvironment</article-title>. <source>Cell Mol Immunol</source> (<year>2020</year>) <volume>17</volume>(<issue>1</issue>):<fpage>27</fpage>&#x2013;<lpage>35</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41423-019-0344-8</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>