<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">733654</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2021.733654</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Recurrence Risk of Liver Cancer Post-hepatectomy Using Machine Learning and Study of Correlation With Immune Infiltration</article-title>
<alt-title alt-title-type="left-running-head">Qian et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">Predicting Recurrence of Liver Cancer</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Qian</surname>
<given-names>Xiaowen</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zheng</surname>
<given-names>Huilin</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1307963/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Xue</surname>
<given-names>Ke</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chen</surname>
<given-names>Zheng</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Hu</surname>
<given-names>Zhenhua</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zhang</surname>
<given-names>Lei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/735431/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Wan</surname>
<given-names>Jian</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
</contrib>
</contrib-group>
<aff id="aff1">
<label>
<sup>1</sup>
</label>Department of Information and Electronic Engineering, Zhejiang University of Science and Technology, <addr-line>Hangzhou</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<label>
<sup>2</sup>
</label>Department of Biological and Chemical Engineering, Zhejiang University of Science and Technology, <addr-line>Hangzhou</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<label>
<sup>3</sup>
</label>Division of Hepatobiliary and Pancreatic Surgery, Department of Surgery, Fourth Affiliated Hospital, School of Medicine, Zhejiang University, <addr-line>Yiwu</addr-line>, <country>China</country>
</aff>
<aff id="aff4">
<label>
<sup>4</sup>
</label>Key Laboratory of Combined Multi-Organ Transplantation, Division of Hepatobiliary and Pancreatic Surgery, Department of Surgery, First Affiliated Hospital, School of Medicine, Zhejiang University, Ministry of Public Health Key Laboratory of Organ Transplantation, <addr-line>Hangzhou</addr-line>, <country>China</country>
</aff>
<aff id="aff5">
<label>
<sup>5</sup>
</label>Division of Hepatobiliary and Pancreatic Surgery, Yiwu Central Hospital, <addr-line>Yiwu</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/865204/overview">Honghao Gao</ext-link>, Shanghai University, China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/711875/overview">Nguyen Quoc Khanh Le</ext-link>, Taipei Medical University, Taiwan</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1259140/overview">Takayuki Shiomi</ext-link>, International University of Health and Welfare, Japan</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Huilin Zheng, <email>zhenghuilin@zust.edu.cn</email>; Lei Zhang, <email>papaver_rhoeas@126.com</email>; Jian Wan, <email>wanjian@zust.edu.cn</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Computational Genomics, a section of the journal Frontiers in Genetics</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>08</day>
<month>12</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>12</volume>
<elocation-id>733654</elocation-id>
<history>
<date date-type="received">
<day>30</day>
<month>06</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>24</day>
<month>11</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2021 Qian, Zheng, Xue, Chen, Hu, Zhang and Wan.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Qian, Zheng, Xue, Chen, Hu, Zhang and Wan</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<abstract>
<p>Postoperative recurrence of liver cancer is the main obstacle to improving the survival rate of patients with liver cancer. We established an mRNA-based model to predict the risk of recurrence after hepatectomy for liver cancer and explored the relationship between immune infiltration and the risk of recurrence after hepatectomy for liver cancer. We performed a series of bioinformatics analyses on the gene expression profiles of patients with liver cancer, and selected 18 mRNAs as biomarkers for predicting the risk of recurrence of liver cancer using a machine learning method. At the same time, we evaluated the immune infiltration of the samples and conducted a joint analysis of the recurrence risk of liver cancer and found that B&#x20;cell, B&#x20;cell naive, T&#x20;cell CD4<sup>&#x2b;</sup> memory resting, and T&#x20;cell CD4<sup>&#x2b;</sup> were significantly correlated with the risk of postoperative recurrence of liver cancer. These results are helpful for early detection, intervention, and the individualized treatment of patients with liver cancer after surgical resection, and help to reveal the potential mechanism of liver cancer recurrence.</p>
</abstract>
<kwd-group>
<kwd>liver cancer</kwd>
<kwd>recurrence risk</kwd>
<kwd>machine learning</kwd>
<kwd>immune infiltration</kwd>
<kwd>TCGA</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>Liver cancer is a common malignancy with morbidity and mortality ranking sixth and fourth, respectively. (<xref ref-type="bibr" rid="B5">Bray et&#x20;al., 2018</xref>). Surgical resection is the most common treatment method for liver cancer. However, the high recurrence and metastasis rate of liver cancer patients after resection poses a great challenge to liver cancer treatment. According to statistics, the recurrence rate of liver cancer patients 3&#xa0;years after surgery is approximately 40&#x2013;50%, and the recurrence rate 5&#xa0;years after surgery is as high as 60&#x2013;70%. (<xref ref-type="bibr" rid="B33">Nakayama and Takayama, 2014</xref>). Therefore, it is of great clinical significance to identify high-risk patients with recurrence of liver cancer after radical surgical resection.</p>
<p>With the development of high-throughput sequencing technology, some molecular biomarkers have been reported to predict liver cancer recurrence after hepatectomy. In previous studies, Erb-B2 receptor tyrosine kinase 2 (<italic>ERBB2)</italic> and NUF2 component of the NDC80 Kinetochore Complex (<italic>NUF2)</italic> were reported to be biomarkers of hepatocellular carcinoma (HCC) recurrence after surgery. (<xref ref-type="bibr" rid="B30">Li et&#x20;al., 2017a</xref>), (<xref ref-type="bibr" rid="B12">Feng et&#x20;al., 2021</xref>) D. Wang et&#x20;al. (<xref ref-type="bibr" rid="B7">Chen et&#x20;al., 2020</xref>) demonstrated that the level of interleukin 11 (<italic>IL11</italic>) increased after hepatectomy, which led to the growth of HCC. Zhou et&#x20;al. (<xref ref-type="bibr" rid="B9">Chen et&#x20;al., 2021</xref>) confirmed that WNK lysine deficient protein kinase 2 (<italic>WNK2)</italic> is a driving factor of HCC and a risk factor for early recurrence through genome sequencing. However, due to the complex etiology of liver cancer (such as hepatitis virus infection, alcohol-related liver disease, nonalcoholic fatty liver) and the difficulty of collecting liver cancer samples with a history of recurrence after hepatectomy, the predictive effect of individual genes screened from a limited number of samples in previous studies may be limited and may not be generally applicable to liver cancer caused by different etiologies. Our study included 306 liver cancer samples caused by different etiologies from The Cancer Genome Atlas, which is the largest sample size that can be incorporated with both recurrent disease history and sequencing data currently, improving the reliability of prediction.</p>
<p>Machine learning is a mathematical method for finding patterns in data to achieve artificial intelligence, and is now widely used in medical image detection and medical aid diagnosis. (<xref ref-type="bibr" rid="B30">Li et&#x20;al., 2017a</xref>; <xref ref-type="bibr" rid="B7">Chen et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B9">Chen et&#x20;al., 2021</xref>; <xref ref-type="bibr" rid="B12">Feng et&#x20;al., 2021</xref>). Some studies have used machine learning methods to predict the recurrence of liver cancer. Ho et&#x20;al.(<xref ref-type="bibr" rid="B16">Ho et&#x20;al., 2006</xref>) constructed a KNN model based on 18 patients to predict HCC recurrence after resection. Liang et&#x20;al. (<xref ref-type="bibr" rid="B31">Liang et&#x20;al., 2014</xref>) analyzed 83 patients with HCC after radio frequency ablation and constructed an SVM model to predict HCC recurrence. However, it is worth noting that KNN and SVM have good predictive performance, but they are commonly used to solve classification problems and are not very explanatory for variables. Random forest in machine learning is an ensemble classifier, and the tree-based ensemble makes it suitable for handling with redundant features. (<xref ref-type="bibr" rid="B39">Reif et&#x20;al., 2006</xref>). Unlike KNN, SVM and random forest, logistic regression is a regression analysis that gives formulaic results to quantify the probability of event occurrence, with good interpretation of variables. (<xref ref-type="bibr" rid="B35">Nick and Campbell, 2007</xref>).</p>
<p>In our study, we aimed to identify potential biomarkers of liver cancer recurrence after resection, and construct a model to quantify the risk of recurrence based on the biomarkers. The above advantages of logistic regression make it a suitable algorithm for our study. In order to solve the problem that logistic regression is difficult to handle with high-dimensional variables, we performed random forest to screen variables. The model constructed using this combined method allows for the quantification of the risk of liver cancer recurrence and good predictive performance.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>Materials and Methods</title>
<sec id="s2-1">
<title>Patient Selection</title>
<p>The RNA-seq data and clinical data of samples with liver cancer were downloaded from The Cancer Genome Atlas database (<ext-link ext-link-type="uri" xlink:href="https://portal.gdc.cancer.gov/">https://portal.gdc.cancer.gov/</ext-link>). The detailed clinical data included age, sex, TNM stage, histologic grade, and recurrence (<xref ref-type="sec" rid="s10">Supplementary Table S1</xref>). Each file downloaded was the mRNA expression data of one sample, and we collated all sample data into one file to obtain an mRNA expression matrix of all samples, while matching the clinical information to the corresponding samples. The inclusion criteria for the cohort were as follows: 1) Normal tissue samples were removed. 2) Samples with R0 excision were selected for further analyses. Next, according to whether new tumor events occurred after the initial treatment, the patients were divided into recurrence and non-recurrence groups. Patients who had a new tumor event after the initial treatment and the type of new tumor event were intrahepatic recurrence, locoregional recurrence, or extrahepatic recurrence were included in the recurrence group. Samples that did not develop new tumor events after the initial treatment were included in the non-recurrence group. Finally, 306 usable samples were obtained, including 158&#x20;non-recurrent and 148 recurrent samples. The clinical characteristics of the recurrence and non-recurrence groups are shown in <xref ref-type="sec" rid="s10">Supplementary Table&#x20;S2</xref>.</p>
<p>In the subsequent analysis, the samples were further divided into two subgroups based on etiology: the alcohol-associated liver disease subgroup (ALD, n &#x3d; 57) and the hepatitis virus infection-related subgroup (HVI, n &#x3d; 98). The HVI subgroup included those associated with hepatitis B virus (HBV, n &#x3d; 71) and hepatitis C virus (HCV, n &#x3d; 27) infections. Considering the small sample size of HCV, HCV and HBV were not split into two subgroups and were uniformly classified as the HVI subgroup. The remaining patients (n &#x3d; 151) were not included in the subgroup analysis due to missing etiologies.</p>
</sec>
<sec id="s2-2">
<title>Screening of DE-mRNAs</title>
<p>DESeq and EdgeR packages in R software (<ext-link ext-link-type="uri" xlink:href="https://www.r-project.org/">https://www.r-project.org/</ext-link>) were used to screen DE-mRNAs between the recurrence and non-recurrence groups. The threshold was set at <italic>p</italic>&#x20;&#x3c; 0.05, and &#x7c;log2 (fold change)&#x7c;&#x3e;1. Overlapping DE-mRNAs screened using the two packages were used for further analyses.</p>
</sec>
<sec id="s2-3">
<title>Functional Enrichment and Co-expression Network</title>
<p>Gene Ontology (GO) functional enrichment of these DE-mRNAs was conducted using the database for annotation, visualization, and integrated discovery (<ext-link ext-link-type="uri" xlink:href="https://david.ncifcrf.gov/">https://david.ncifcrf.gov/</ext-link>), and <italic>p</italic>&#x20;&#x3c; 0.05, was set as the cutoff value. The co-expression network between DE-mRNAs was predicted using the STRING database (<ext-link ext-link-type="uri" xlink:href="https://string-db.org/">https://string-db.org/</ext-link>) and visualized using Cytoscape (<ext-link ext-link-type="uri" xlink:href="https://cytoscape.org/">https://cytoscape.org/</ext-link>).</p>
</sec>
<sec id="s2-4">
<title>Estimation of Immune Cells and Identification of Differential Immune Cells</title>
<p>Based on the mRNA expression levels of the recurrence and non-recurrence groups, we used the TIMER database (<ext-link ext-link-type="uri" xlink:href="http://timer.cistrome.org/">http://timer.cistrome.org/</ext-link>) to estimate the expression of immune cells in the two groups.</p>
</sec>
<sec id="s2-5">
<title>Development of the Risk Assessment Model</title>
<p>The overall flow chart of this study was shown in <xref ref-type="sec" rid="s10">Supplementary Figure S1</xref>. 306 patients were assigned to the training cohort (n &#x3d;&#x20;215) or validation cohort (n &#x3d; 91) with a 7:3 split ratio by applying simple random sampling. In the training cohort, 60&#x20;DE-mRNAs were entered into random forest (RF) as variables. RF is an ensemble method based on multiple decision trees, and the decision trees in RF are built by randomly selected samples made from bootstrap and a randomly selected subset of variables. Some original samples were not selected to construct trees, which are called out-of-bag (OOB) dataset. (<xref ref-type="bibr" rid="B6">Breiman, 2001</xref>). After inputting 60 variables into RF, mean decrease accuracy (MDA) and mean decrease Gini (MDG) provided in RF were calculated to assess the importance scores of each variable for liver cancer recurrence. MDA quantifies the importance of a variable by calculating the mean decrease accuracy in the OOB before and after the permutation of the variable, and MDG quantifies the importance of a variable by measuring the mean decrease in Gini impurity caused by the variable when it is used to form a split in the random forest. (<xref ref-type="bibr" rid="B11">D&#xed;az-Uriarte and de Andr&#xe9;s, 2006</xref>; <xref ref-type="bibr" rid="B47">Wang et&#x20;al., 2016</xref>). These were achieved by the &#x201c;randomForest&#x201d; package in R software. Next, a variable ranking was obtained by ranking the importance scores. Larger values of the importance scores represented greater influence of DE-mRNAs on recurrence. The variable ranking can be described as:<disp-formula id="equ1">
<mml:math id="m1">
<mml:mrow>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mo>&#x22ef;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>d</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf1">
<mml:math id="m2">
<mml:mrow>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1,2</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#x22ef;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the index of variable <inline-formula id="inf2">
<mml:math id="m3">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> in the descending ranking. We took MDA as the importance scores to obtain the top 30 importance ranking of variables <inline-formula id="inf3">
<mml:math id="m4">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>X</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>k</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, and took MDG as the importance scores to obtain the top 30 importance ranking of variables <inline-formula id="inf4">
<mml:math id="m5">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>X</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>k</mml:mi>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. In order to obtain a small scale of variables and increase reliability, we took the intersection of the variables in <inline-formula id="inf5">
<mml:math id="m6">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>X</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>k</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf6">
<mml:math id="m7">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>X</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>k</mml:mi>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> as the variables to be put into the risk assessment model, which can be presented as:<disp-formula id="equ2">
<mml:math id="m8">
<mml:mrow>
<mml:mi>X</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>X</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>k</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2229;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>X</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>k</mml:mi>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</disp-formula>
</p>
<p>After the above steps, 18&#x20;DE-mRNAs with important effects on liver cancer recurrence were obtained as the input variables for the risk assessment&#x20;model.</p>
<p>Multivariate logistic regression was used to construct the risk assessment model for liver cancer recurrence. The calculation formula of risk score can be presented as:<disp-formula id="equ3">
<mml:math id="m9">
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>k</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>s</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:msup>
<mml:mtext>e</mml:mtext>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msup>
<mml:mi>&#x3c9;</mml:mi>
<mml:mi>T</mml:mi>
</mml:msup>
<mml:mi>X</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
</p>
<p>In our study, <inline-formula id="inf7">
<mml:math id="m10">
<mml:mi>X</mml:mi>
</mml:math>
</inline-formula> is the expression level of each DE-mRNA, and the parameters <inline-formula id="inf8">
<mml:math id="m11">
<mml:mi>&#x3c9;</mml:mi>
</mml:math>
</inline-formula> and <inline-formula id="inf9">
<mml:math id="m12">
<mml:mi>b</mml:mi>
</mml:math>
</inline-formula> can be learned from the training data. The parameter <inline-formula id="inf10">
<mml:math id="m13">
<mml:mi>&#x3c9;</mml:mi>
</mml:math>
</inline-formula> can be interpreted as the relative impact of each DE-mRNA in the recurrence of liver cancer. In the training cohort, 18&#x20;DE-mRNAs screened by random forest were entered into logistic regression, and the model was validated using the validation cohort.</p>
<p>In addition, a logistic regression model without variable screening (model 2), a logistic model with stepwise regression (model 3), and a logistic model with L1 regularization (model 4) were constructed for comparison. In model 2, a logistic regression model was constructed directly with 60&#x20;DE-mRNAs. Model 3 was constructed by stepwise logistic regression with Akaike information criterion (AIC) for feature selection, which is a classic variable selection method. (<xref ref-type="bibr" rid="B1">Agostini et&#x20;al., 2015</xref>; <xref ref-type="bibr" rid="B40">Sanchez-pinto et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B19">Hu et&#x20;al., 2019</xref>).Model 4 added the L1 regularization term to the logistic regression, which can have a dimensionality reduction effect. (<xref ref-type="bibr" rid="B46">Tibshirani, 1996</xref>; <xref ref-type="bibr" rid="B48">Wang et&#x20;al., 2014</xref>). The &#x201c;glmnet&#x201d; package in R software was used for the analyses. StromalScore, ImmuneScore, and ESTIMATEScore are three scores used to assess the level of infiltrating stromal and immune cells. (<xref ref-type="bibr" rid="B53">Yoshihara et&#x20;al., 2013</xref>). They were calculated to compare with the risk score presented in our study, using the &#x201c;estimate&#x201d; package in R software.</p>
</sec>
<sec id="s2-6">
<title>Performance Evaluation of the Prediction Models</title>
<p>The receiver operating characteristics (ROC) curve and the area under the ROC curve (AUC) were used to evaluate the performance of the models. As measures of model performance, they exhibit some desirable properties and are good ways to visualize model performance. (<xref ref-type="bibr" rid="B4">Bradley, 1997</xref>). In the field of big biological data and cancer-related research, ROC and AUC are widely used to evaluate the performance of machine learning models. (<xref ref-type="bibr" rid="B25">Le et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B54">Yu et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B24">Kudo et&#x20;al., 2021</xref>; <xref ref-type="bibr" rid="B26">Le et&#x20;al., 2021</xref>). ROC and AUC analyses were performed by R software.</p>
</sec>
<sec id="s2-7">
<title>Statistical Analysis</title>
<p>All statistical analyses were performed using GraphPad Prism version 8.0 software (GraphPad Software Inc.). A two-tailed <italic>t</italic>-test was used to identify immune cells that were significantly different between the recurrence and non-recurrence groups. In all analyses, a two-tailed <italic>p</italic>-value less than 0.05, was considered statistically significant. Random forest and logistic regression models were performed using R software (version 4.0.2). The codes for this study have been uploaded on GitHub (<ext-link ext-link-type="uri" xlink:href="https://github.com/polarbbbear/code">https://github.com/polarbbbear/code</ext-link>).</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec id="s3-1">
<title>Identification of DE-mRNAs and the Link Between DE-mRNAs</title>
<p>The clinical information of the entire data, training data, and validation data are presented in <xref ref-type="sec" rid="s10">Supplementary Table S1</xref>. Kaplan-Meier curves indicated a significant difference in prognosis between the recurrence and non-recurrence groups (<xref ref-type="fig" rid="F1">Figure&#x20;1A</xref>). Using the edgeR and DESeq packages of R, 199 and 204 mRNAs that were significantly different between the recurrence and non-recurrence groups were identified, respectively (<xref ref-type="fig" rid="F1">Figures 1B, C</xref>). Next, 60 overlapping DE-mRNAs were obtained through the cross between the differentially expressed mRNAs identified by the edgeR package and DESeq package (<xref ref-type="fig" rid="F1">Figure&#x20;1D</xref>). To unveil the relationships among all DE-mRNAs, we constructed a network diagram of protein interactions by the string database (<xref ref-type="sec" rid="s10">Supplementary Figure S2A</xref>). In order of the ability to interact with the others, the top 10 genes were CEA Cell Adhesion Molecule 5 (<italic>CEACAM5</italic>), Mucin 1, Cell Surface Associated (<italic>MUC1</italic>), Cathepsin G (<italic>CTSG</italic>), Ret Proto-Oncogene (<italic>RET</italic>), CD79a Molecule (<italic>CD79A</italic>), Collagen Type XI Alpha 2 Chain (<italic>COL11A2</italic>), GLI Family Zinc Finger 2 (<italic>GLI2</italic>), Collagen Type X Alpha 1 Chain (<italic>COL10A1</italic>), Myosin Light Chain 3 (<italic>MYL3</italic>), Tectorin Beta (<italic>TECTB</italic>). Interestingly, we found that most of these key node genes play important roles in tumorigenesis (<italic>RET</italic>, <italic>CEACAM5</italic>), immune regulation (<italic>CTSG</italic>, <italic>CD79A</italic>) and the EMT pathway (<italic>COL10A1</italic>, <italic>COL11A2</italic>), suggesting their significant role in the recurrence of liver cancer. To quantify the interaction relationships between DE-mRNAs, we calculated the correlation of DE-mRNAs and found that many genes of the immunoglobulin superfamily were highly positively correlated (<xref ref-type="sec" rid="s10">Supplementary Figure S2B</xref>), such as genes of the Immunoglobulin Heavy Variable (IGHV) and Immunoglobulin Kappa Variable (IGKV) regions. The combination of these genes may co-regulate immune function in patients and affect the recurrence of liver cancer after surgery.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Identification of DE-mRNAs <bold>(A)</bold> Kaplan-Meier curves of OS between the recurrence and non-recurrence groups across the entire dataset <bold>(B)</bold> DE-mRNAs that identified using the edgeR package <bold>(C)</bold> DE-mRNAs that identified using the DESeq package <bold>(D)</bold> Overlapping DE-mRNAs between the selection methods.</p>
</caption>
<graphic xlink:href="fgene-12-733654-g001.tif"/>
</fig>
</sec>
<sec id="s3-2">
<title>Functional Enrichment for mRNAs Co-expressed</title>
<p>To comprehensively study the potential mechanism of liver cancer recurrence, functional enrichment was performed in both groups. The results of the GO enrichment analysis are shown in <xref ref-type="fig" rid="F2">Figures 2A, B</xref>. It was noted that the DE-mRNAs between the two groups were significantly enriched in immune-related pathways such as antigen binding, Fc-gamma receptor signaling pathway involved in phagocytosis, regulation of immune response, immune response, immunoglobulin receptor binding, positive regulation of B&#x20;cell activation, B&#x20;cell receptor signaling pathway, immunoglobulin complex and circulating, innate immune response, and B&#x20;cell activation. Moreover, GSEA enrichment results showed that there were significant differences in the B&#x20;cell receptor signaling pathway, T&#x20;cell receptor signaling pathway, cell cycle, RNA polymerase, and DNA replication between the recurrence and non-recurrence groups. The B&#x20;cell receptor signaling pathway and the T&#x20;cell receptor signaling pathway-related genes were significantly enriched in the non-recurrence group, while the cell cycle, RNA polymerase, and DNA replication pathway-related genes were significantly enriched in the recurrence group (<xref ref-type="fig" rid="F2">Figures 2C&#x2013;G</xref>). These results suggested that the changes of immune-related functions may be the mechanism influencing liver cancer recurrence.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Functional enrichment for mRNAs co-expressed <bold>(A)</bold> The bubble pattern shows the enrichment pathways with Gene Ratio, gene count and <italic>p</italic>-value <bold>(B)</bold> The histogram shows the enrichment of molecular function, biological process and cellular component. Results of GSEA enrichment on <bold>(C)</bold> B&#x20;cell receptor signaling pathway <bold>(D)</bold> T&#x20;cell receptor signaling pathway <bold>(E)</bold> Cell cycle <bold>(F)</bold> RNA polymerase, and <bold>(G)</bold> DNA replication.</p>
</caption>
<graphic xlink:href="fgene-12-733654-g002.tif"/>
</fig>
</sec>
<sec id="s3-3">
<title>Identification of Immune Cells With Significant Difference Between Two Groups</title>
<p>The results of functional enrichment suggested that there were significant differences in immune-related pathways between the recurrence and non-recurrence groups. In order to investigate which immune cells are involved in the mechanisms influencing the recurrence of liver cancer, we used the TIMER database (<ext-link ext-link-type="uri" xlink:href="http://timer.cistrome.org">http://timer.cistrome.org</ext-link>) to estimate the expression level of immune cells in the two groups, and the <italic>t</italic>-test was used to determine whether there were significant differences in the expression of immune cells between the two groups. Immune cells showed significant differences between the recurrence and non-recurrence groups (<xref ref-type="fig" rid="F3">Figures 3A&#x2013;D</xref>), and the expression of naive B&#x20;cells, B&#x20;cells, T&#x20;cell CD4<sup>&#x2b;</sup> memory resting, and T&#x20;cell CD4<sup>&#x2b;</sup> were downregulated in the recurrence group. The results demonstrated the significant influence of these four immune cells on liver cancer recurrence.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Immune cells that are significantly different between the recurrence and non-recurrence groups <bold>(A)</bold> B&#x20;cell naive expression between the two groups <bold>(B)</bold> B&#x20;cell expression between the two groups <bold>(C)</bold> T&#x20;cell CD4<sup>&#x2b;</sup> memory resting expression between the two groups <bold>(D)</bold> T&#x20;cell CD4<sup>&#x2b;</sup> expression between the two groups.&#x2a;<italic>p</italic>&#x20;&#x3c; 0.05, &#x2a;&#x2a;<italic>p</italic>&#x20;&#x3c; 0.01 and &#x2a;&#x2a;&#x2a;<italic>p</italic>&#x20;&#x3c; 0.001.</p>
</caption>
<graphic xlink:href="fgene-12-733654-g003.tif"/>
</fig>
</sec>
<sec id="s3-4">
<title>Construction and Performance Evaluation of the Risk Assessment Model</title>
<p>To identify the mRNAs that play an important role in liver cancer recurrence, we constructed 500 decision trees using random forest with 60&#x20;DE-mRNAs as features and measured the importance of each DE-mRNA on recurrence by calculating the mean decrease Gini and mean decrease accuracy for each DE-mRNA. The top 30&#x20;DE-mRNAs ranked by mean decrease Gini and mean decrease accuracy were selected (<xref ref-type="fig" rid="F4">Figures 4A, B</xref>). The top 30 mRNAs were intersected, and 18 overlapping mRNAs were finally selected to construct the risk assessment model (<xref ref-type="fig" rid="F4">Figures 4C,&#x20;D</xref>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Construction of a risk assessment model <bold>(A)</bold> Top 30&#x20;DE-mRNAs with mean decrease Gini <bold>(B)</bold> Top 30&#x20;DE-mRNAs with mean decrease accuracy <bold>(C)</bold> Overlapping DE-mRNAs between the selection methods <bold>(D)</bold> Logistic risk model constructed by overlapping DE-mRNAs.</p>
</caption>
<graphic xlink:href="fgene-12-733654-g004.tif"/>
</fig>
<p>Subsequently, we trained an 18-mRNA risk assessment model in the training cohort using logistic regression analysis. These 18 mRNAs were uncharacterized LOC644135 (<italic>LOC644135),</italic> elastin (<italic>ELN),</italic> GULP PTB domain-containing engulfment adaptor 1 (<italic>GULP1)</italic>, <italic>ENSG00</italic>000248635 (a novel gene), Glycoprotein M6A (GPM6A), peptidase inhibitor 15 (PI15), Sphingosine-1-Phosphate phosphatase 2 (SGPP2), transmembrane protein 200C (TMEM200C), cadherin 3 (CDH3), selectin P (SELP), collagen and calcium binding EGF domains 1 (CCBE1), immunoglobulin lambda variable 1&#x2013;44 (IGLV1-44), Immunoglobulin Lambda Variable 2&#x2013;11 (IGLV2-11), Immunoglobulin Lambda Like Polypeptide 5 (IGLL5), Immunoglobulin Heavy Variable 3&#x2013;23 (IGHV3-23), Immunoglobulin Heavy Variable 5&#x2013;51 (IGHV5-51), Immunoglobulin Heavy Constant Gamma 2 (IGHG2), and CD79a molecule (CD79A). The risk assessment model was developed based on the coefficients of mRNAs and the constant derived from this analysis. The value of the constant b in the logistic regression formula was 0.3883, and the coefficients of mRNAs were shown in <xref ref-type="fig" rid="F4">Figure&#x20;4D</xref>.</p>
<p>In the training cohort, the performance of the risk assessment model was good, with an AUC value of 0.7356 (<xref ref-type="fig" rid="F5">Figures 5A, B</xref>). Subsequently, we assessed the robustness and accuracy of this 18-mRNA signature by applying the same statistical model to the validation cohort. In the validation cohort, the 18-mRNA biomarkers also showed significant diagnostic accuracy in identifying postoperative recurrence in patients with liver cancer, with an AUC value of 0.7285 (<xref ref-type="fig" rid="F5">Figures 5C,&#x20;D</xref>).</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Performance evaluation of the risk assessment model.The ROC curves demonstrate the diagnostic performance of the model in distinguishing recurrent patients in the <bold>(A)</bold> training cohort and <bold>(C)</bold> validation cohort. The histograms show the risk score distribution in the <bold>(B)</bold> training and <bold>(D)</bold> validation cohorts. For convenience of display, the risk score is subtracted from the median and magnified 10&#x20;times to obtain the modified risk&#x20;score.</p>
</caption>
<graphic xlink:href="fgene-12-733654-g005.tif"/>
</fig>
<p>Liver cancer is multi-centric and is significantly affected by background diseases. Different disease backgrounds may have influenced the results of the model. Therefore, we tried to verify whether the 18-mRNA signature can show good predictive performance in different etiological sources of liver cancer subgroups. Restricted by limited etiological data on patients, we could only divide the samples into ALD (n &#x3d; 57) and HVI (n &#x3d; 98) subgroups. Within the ALD subgroup, we randomly re-divided the training and validation cohorts in a 7:3 ratio and reconstructed a logistic model with the 18 mRNAs based on the training cohort to predict recurrence in patients in the ALD group and validated them in the validation cohort. The same procedure was performed for the HVI subgroup. These were executed to reduce the effect of background disease on the prediction results of the 18 mRNAs. In both subgroups, the 18-mRNA logistic regression models exhibited good and similar predictive performances. In the ALD subgroup, the AUC values of the 18-mRNA model were 0.8107 and 0.7273 on the training and validation sets, respectively. In the HVI subgroup, the AUC values were 0.8795 and 0.7764 for the training and validation sets, respectively (<xref ref-type="sec" rid="s10">Supplementary Figure S3A&#x2013;D</xref>). In summary, the 18-mRNA signature performed well in predicting liver cancer of different etiological sources (viral infection and alcohol-related), suggesting that our predictive markers may be universally applicable for predicting the recurrence of liver cancer from different etiological sources.</p>
<p>In order to form a comparison with the logistic regression model constructed by the above method, we used two other variable screening methods and constructed three different logistic models: a logistic regression model without variable filtering (model 2), a logistic regression model with variable filtering by stepwise regression (model 3), and a logistic regression model with variable filtering by L1 regularization (model 4). The prediction results of these three models are good in the training set, but the results in the validation set are much worse than those in the training set (<xref ref-type="sec" rid="s10">Supplementary Figure S4A&#x2013;F</xref>), that is, the models constructed by the three methods show serious overfitting. In contrast, the logistic model constructed after filtering with the random forest algorithm showed similar results and good predictions for both the training and validation cohorts.</p>
<p>We also compared the risk score with the StromalScore, ImmuneScore, and ESTIMATEScore. The StromalScore, ImmuneScore, and ESTIMATEScore were calculated based on the expressions of mRNAs. In the training set, the AUC values of the StromalScore, ImmuneScore, and ESTIMATEScore for predicting recurrence of liver cancer were 0.5581, 0.5599, and 0.5643, respectively, and 0.5923, 0.5942 and 0.5948 in the validation set, respectively (<xref ref-type="sec" rid="s10">Supplementary Figure S5A&#x2013;F</xref>). This indicated that the risk score proposed in our study had better performance in predicting the recurrence of liver cancer compared to StromalScore, ImmuneScore, and ESTIMATEScore.</p>
</sec>
<sec id="s3-5">
<title>Correlation Between Risk Score and Immune Cells</title>
<p>The previous analysis results showed that the recurrence of liver cancer after surgery was significantly associated with the expression of immune cells. Furthermore, to confirm the relationship between the risk of recurrence and immune infiltration, we performed correlation analysis between the recurrence risk score estimated using the previously established risk assessment model and immune cells. In the training cohort, B&#x20;cell naive, B&#x20;cell, T&#x20;cell CD4<sup>&#x2b;</sup> memory resting, and T&#x20;cell CD4<sup>&#x2b;</sup> expression levels were significantly negatively correlated with the risk score (<xref ref-type="fig" rid="F6">Figures 6A&#x2013;D</xref>). The negative association between these immune cells and the risk score was also verified in the validation cohort (<xref ref-type="fig" rid="F6">Figures 6E&#x2013;H</xref>). The results demonstrated the validity of the risk score predicted by the 18-mRNA model and further confirmed the negative association between these four immune cells and postoperative recurrence of liver cancer.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Correlation between risk scores and immune cells.Correlation between risk score and <bold>(A)</bold> B&#x20;cell naive <bold>(B)</bold> B&#x20;cell <bold>(C)</bold> T&#x20;cell CD4<sup>&#x2b;</sup> memory resting <bold>(D)</bold> T&#x20;cell CD4<sup>&#x2b;</sup> in the training data. Correlation between risk score and <bold>(E)</bold> B&#x20;cell naive <bold>(F)</bold> B&#x20;cell <bold>(G)</bold> T&#x20;cell CD4<sup>&#x2b;</sup> memory resting <bold>(H)</bold> T&#x20;cell CD4<sup>&#x2b;</sup> in the validation data. For convenience of display, the risk score is subtracted from the median and magnified 10&#x20;times to obtain the modified risk score. &#x2a;<italic>p</italic>&#x20;&#x3c; 0.05, &#x2a;&#x2a;<italic>p</italic>&#x20;&#x3c; 0.01 and &#x2a;&#x2a;&#x2a;<italic>p</italic>&#x20;&#x3c; 0.001.</p>
</caption>
<graphic xlink:href="fgene-12-733654-g006.tif"/>
</fig>
</sec>
<sec id="s3-6">
<title>Prognostic Analysis Using the Risk Scores in the Training and Validation Sets</title>
<p>To improve the clinical prognostic significance of the risk score, we then grouped patients by risk score and performed Kaplan-Meier survival analysis. X-tile software was used to obtain the best truncation value, and patients in the training cohort were divided into low-risk and high-risk groups (<xref ref-type="fig" rid="F7">Figures 7A, B</xref>). We observed a significant difference in overall survival (OS) between the low-risk and high-risk groups in the training cohort (<italic>p</italic>&#x20;&#x3d; 0.0235) (<xref ref-type="fig" rid="F7">Figure&#x20;7C</xref>). Similarly, in the validation cohort, there was a significant difference in the prognosis between the high- and low-risk groups classified by the X-tile software (<italic>p</italic>&#x20;&#x3d; 0.0097) (<xref ref-type="fig" rid="F7">Figures 7D&#x2013;F</xref>). The results indicated that risk score had good prognostic value for liver cancer patients.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Prognostic analysis using the risk scores in the training and validation sets. Optimal cutoff value of the risk score divided by X-tile software in the training data <bold>(A, B) (C)</bold> Kaplan-Meier curve of the two groups divided by the cutoff value in the training data. The optimal cutoff value of the risk score was divided by the X-tile software in the validation data <bold>(D, E) (F)</bold> Kaplan-Meier curve of the two groups divided by the cutoff value in the validation data. &#x2a;<italic>p</italic>&#x20;&#x3c; 0.05, &#x2a;&#x2a;<italic>p</italic>&#x20;&#x3c; 0.01 and &#x2a;&#x2a;&#x2a;<italic>p</italic>&#x20;&#x3c; 0.001.</p>
</caption>
<graphic xlink:href="fgene-12-733654-g007.tif"/>
</fig>
</sec>
<sec id="s3-7">
<title>Univariate and Multivariate Analyses of the mRNA Signature Prognostic Abilities</title>
<p>To verify the prognostic value of the 18-mRNA signature independently from the clinicopathological characteristics, we performed Cox univariate and multivariate analyses that included 18-mRNA risk score, age, sex, histologic grade, and TNM stage as co-variables in the training and validation cohorts. In univariate and multivariate analyses of the training cohort, TMN stage was found to be related to OS (<xref ref-type="sec" rid="s10">Supplementary Figure S6A&#x2013;B</xref>). However, in univariate and multivariate analyses of the validation cohort, the TMN stage was no longer significantly correlated with OS, and the risk score was a significant variable related to OS (<xref ref-type="sec" rid="s10">Supplementary Figure S6C&#x2013;D</xref>). HR values of the risk score were significant but not high, which was not perfect in clinical prognosis prediction. In addition, histologic grade and TMN stage appeared to have high but not significant HR values, which may be due to excessive standard errors of the variables. (<xref ref-type="bibr" rid="B22">Katz and Hauck, 1993</xref>).</p>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>In this study, we constructed a risk scoring model with 18 mRNAs to predict post-hepatectomy recurrence of liver cancer. The 18 mRNAs were LOC644135, ELN, GULP1, ENSG00000248635, GPM6A, PI15, SGPP2, TMEM200C, CDH3, SELP, CCBE1, IGLV1-44, IGLV2-11, IGLL5, IGHV3-23, IGHV5-51, IGHG2, and CD79A.The risk assessment model could accurately distinguish between low- and high-risk samples for the recurrence of liver cancer after resection, with good prognostic performance. The identified 18 mRNAs also had good predictive performance in liver cancer samples caused by different etiologies. B&#x20;cell naive, B&#x20;cell, T&#x20;cell CD4<sup>&#x2b;</sup> memory resting, and T&#x20;cell CD4<sup>&#x2b;</sup> were significantly different in recurrence versus non-recurrence liver cancer samples and were found to be negatively correlated with the risk scores predicted by the constructed model by correlation analysis.</p>
<p>Compared to the classification algorithms in machine learning, regression analysis has better explanatory power for variables. The advantage of our method is that it combines random forest with regression analysis to screen biomarkers of liver cancer recurrence and construct a formulaic risk assessment model of liver cancer recurrence, which ensures the interpretability of variables with good predictive performance. We also constructed a logistic regression model without feature screening, a stepwise regression logistic model, and an L1 regularized logistic model, which revealed that the random forest-based logistic regression model had better generalization performance on the validation set. Meanwhile, compared to StromalScore, ImmuneScore, and ESTIMATEScore, our risk score showed better performance to predict recurrence risk of liver cancer.</p>
<p>In previous studies, machine learning methods have also been used to predict liver cancer recurrence. Wang et&#x20;al.(<xref ref-type="bibr" rid="B49">Wang et&#x20;al., 2020</xref>) used lasso and Cox regressions to screen five mRNAs to predict HCC recurrence, and the predicted AUC values for 1-year, 2-year, and 3-year RFS rates from the independent validation data were 0.752, 0.651, and 0.677, respectively. Iizuka et&#x20;al.(<xref ref-type="bibr" rid="B21">Iizuka et&#x20;al., 2003</xref>) used Fisher&#x2019;s linear classifier algorithm to predict intrahepatic recurrence in hepatocellular carcinoma patients within 1&#xa0;year after resection, using 18 mRNAs. In the validation sample, the predictive accuracy was 92.6% (25/27). Based on this, Somura et&#x20;al.(<xref ref-type="bibr" rid="B41">Somura et&#x20;al., 2008</xref>) selected three of the mRNAs and constructed a prediction model with the same algorithm, with a correct prediction accuracy of 81.4% (35/43) in the validation set. However, selection bias or publication bias in the small sample sizes may produce inflated over-promising results. (<xref ref-type="bibr" rid="B36">Ntzani and Ioannidis, 2003</xref>). In addition, a few previous studies have used a large number of genetic biomarkers to predict the prognosis of liver cancer. (<xref ref-type="bibr" rid="B27">Lee et&#x20;al., 2006</xref>; <xref ref-type="bibr" rid="B17">Hoshida et&#x20;al., 2008</xref>; <xref ref-type="bibr" rid="B50">Woo et&#x20;al., 2008</xref>). However, due to the different sample selection criteria and definition of the outcomes, there was little gene overlap between these studies. To our knowledge, the present study includes the largest sample size through the machine learning method compared to other studies in HCC recurrence prediction, which may enhance the validity of the gene signature predicted by our study. Our screened 18 mRNAs showed good performance in predicting liver cancer recurrence, with AUCs of 0.7356 and 0.7285 in the training and validation cohorts, respectively.</p>
<p>We report for the first time that LOC644135, ELN, GULP1, ENSG00000248635, GPM6A, and PI15 are associated with the risk of liver cancer recurrence. In addition, some genes that we identified have been reported to play a role in the development, recurrence, and metastasis of cancer in previous studies. It has been reported that Nudix hydrolase 21 promotes tumor growth and metastasis through modulating SGPP2 in gastric cancer. (<xref ref-type="bibr" rid="B57">Zhu et&#x20;al., 2021</xref>). TMEM200C is reported to be hypomethylated, and candidate oncogenes linked to early metastasis in uveal melanoma. (<xref ref-type="bibr" rid="B34">Ness et&#x20;al., 2021</xref>). CDH3, a classical cell adhesion molecule, has been reported to be related to a variety of human cancers. L. Li et&#x20;al. (<xref ref-type="bibr" rid="B29">Li et&#x20;al., 2019</xref>) found that Kruppel-like factor 4 (KLF4)-mediated upregulation of CDH3 inhibits the growth and migration of human hepatoma cells through GSK-3 <inline-formula id="inf11">
<mml:math id="m14">
<mml:mi>&#x3b2;</mml:mi>
</mml:math>
</inline-formula> signaling. Overexpression of CDH3 has been reported to promote the movement of pancreatic cancer cells by interacting with P120ctn and activating Rho family GTPases. (<xref ref-type="bibr" rid="B45">Taniuchi et&#x20;al., 2005</xref>). CDH3 has also been reported to be associated with prognosis in patients with colorectal adenocarcinoma and lung cancer. (<xref ref-type="bibr" rid="B51">Xu et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B18">Hsiao et&#x20;al., 2020</xref>). SELP is a member of the selectin family of cell adhesion molecules, and it mediates heterotypic aggregation of activated platelets to cancer cells and adhesion of cancer cells to stimulated endothelial cells. (<xref ref-type="bibr" rid="B8">Chen and Geng, 2006</xref>). It has been demonstrated that SELP plays an important role in the growth and metastasis of human colon carcinoma <italic>in vivo</italic>. (<xref ref-type="bibr" rid="B23">Kim et&#x20;al., 1998</xref>). CCBE1 is essential in lymphatic vascular development. Song et&#x20;al.(<xref ref-type="bibr" rid="B42">Song et&#x20;al., 2020</xref>) demonstrated the procarcinogenic role of CCBE1 in promoting lymphangiogenesis and metastasis in colorectal cancer, and it has been reported that targeting of CCBE1 by miR-330-3p promotes tumor metastasis in breast cancer. (<xref ref-type="bibr" rid="B32">Mesci et&#x20;al., 2017</xref>). Our results contribute to further understanding of the impact of these genes on recurrence of liver cancer. It is interesting to note that many of the genes we report are immunoglobulin genes (IGLV1-44, IGLV2-11, IGLL5, IGHV3-23, IGHV5-51, IGHG2). Previous studies have shown that some immunoglobulins regulate the tumor microenvironment and influence the prognosis of patients with breast cancer, diffuse large B-cell lymphoma, and chronic lymphocytic leukemia (<xref ref-type="bibr" rid="B2">Baliakas et&#x20;al., 2015</xref>; <xref ref-type="bibr" rid="B55">Zhang et&#x20;al., 2015</xref>; <xref ref-type="bibr" rid="B43">Stamatopoulos et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B52">Xu-Monette et&#x20;al., 2019</xref>), and our results suggest that the above immunoglobulin genes may play an important role in recurrence of liver cancer. CD79A is also an immune function-related gene. CD79A and CD79b molecule (CD79B) heterodimers are important signaling components of the B&#x20;cell receptor (BCR) complex, which plays a crucial role in B&#x20;cell development and antibody production. (<xref ref-type="bibr" rid="B28">Li et&#x20;al., 2017b</xref>). These immune-related genes identified in our study may provide insights into the underlying mechanism of liver cancer recurrence.</p>
<p>Previous studies have reported that immune cells play a role in cancer recurrence. (<xref ref-type="bibr" rid="B3">Bindea et&#x20;al., 2013</xref>; <xref ref-type="bibr" rid="B10">Chevalier et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B56">Zhou et&#x20;al., 2019</xref>). The enrichment results showed that DE-mRNAs were enriched in many immune-related pathways. Therefore, on the basis of predicting liver cancer recurrence, we analyzed the differences in immune cells between patients with and without recurrence, and explored the relationship between the predicted risk of recurrence and differential immune cells in patients with liver cancer. We demonstrated that compared with the non-recurrence group, B&#x20;cell naive, B&#x20;cell, T&#x20;cell CD4<sup>&#x2b;</sup> memory resting, and T&#x20;cell CD4<sup>&#x2b;</sup> were significantly downregulated in the recurrence group and were inversely associated with the recurrence risk evaluated by the model we built. Previous studies have shown that tumor metastasis is associated with the presence of CD4<sup>&#x2b;</sup> T&#x20;cells and B&#x20;cells. Olkhanud et&#x20;al. (<xref ref-type="bibr" rid="B37">Olkhanud et&#x20;al., 2011</xref>) found that tumor-evoked regulatory B&#x20;cells promote breast cancer metastasis by converting resting CD4<sup>&#x2b;</sup> T&#x20;cells to T-regulatory cells. Ou et&#x20;al.(<xref ref-type="bibr" rid="B38">Ou et&#x20;al., 2015</xref>) found that tumor microenvironment B&#x20;cells increase bladder cancer metastasis via modulation of the IL-8/androgen receptor (AR)/MMPs signals. In addition, Guy et&#x20;al. (<xref ref-type="bibr" rid="B15">Guy et&#x20;al., 2016</xref>) found that tumor-specific CD4<sup>&#x2b;</sup> T&#x20;cells and B&#x20;cells play important functions and major roles in anticancer immunity. Many studies have shown that a variety of immunosuppressive signals regulate the tumor microenvironment, which plays an important regulatory role in the process of tumorigenesis, and its heterogeneity can lead to multiple aspects, including patient prognosis and treatment response. (<xref ref-type="bibr" rid="B13">Fridman et&#x20;al., 2012</xref>; <xref ref-type="bibr" rid="B14">Galon et&#x20;al., 2014</xref>; <xref ref-type="bibr" rid="B20">Hui and Chen, 2015</xref>). Sun et&#x20;al. (<xref ref-type="bibr" rid="B44">Sun et&#x20;al., 2021</xref>) reported that recurrent HCC has a unique immune ecosystem compared with the primary HCC tumor microenvironment. Therefore, our findings may provide a new approach for the immunotherapy of liver cancer recurrence.</p>
<p>In conclusion, the risk assessment model developed in this study may serve as a complementary tool to provide useful information for predicting disease outcomes after hepatectomy in patients with liver cancer and guide adjuvant therapy. Meanwhile, the immune cells reported in this study could be the targets of immunotherapy for patients with liver cancer. While these predictions are valuable, the current study has some limitations. The 18-mRNA biomarkers were screened by bioinformatics and machine learning methods, and their expression and specific functions need to be validated by biological experiments. In addition, the predictive performance of the 18-mRNA risk assessment model constructed in our study needs to be validated using large independent samples.</p>
</sec>
</body>
<back>
<sec id="s5">
<title>Data Availability Statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="sec" rid="s10">Supplementary Material</xref>, further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec id="s6">
<title>Author Contributions</title>
<p>XQ and HZ designed the project. ZH, LZ and JW provided administrative, technical, and material support. XQ, KX, and ZC performed statistical analyses. XQ wrote the manuscript. HZ revised the paper. All authors reviewed the manuscript and agreed to its submission.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>This study was supported by the Zhejiang Province Key Research and Development Projects (2020C03057, 2021C03145, 2020C03071) and the National Natural Science Foundation of China (Grant no. 61972358).</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ack>
<p>We sincerely thank the researchers and study participants for their contributions toward this&#x20;study.</p>
</ack>
<sec id="s10">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2021.733654/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2021.733654/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Image5.PDF" id="SM1" mimetype="application/PDF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table1.PDF" id="SM2" mimetype="application/PDF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table2.PDF" id="SM3" mimetype="application/PDF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image6.PDF" id="SM4" mimetype="application/PDF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image4.PDF" id="SM5" mimetype="application/PDF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image2.PDF" id="SM6" mimetype="application/PDF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image3.PDF" id="SM7" mimetype="application/PDF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image1.PDF" id="SM8" mimetype="application/PDF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Agostini</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zangrando</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pastrello</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>D&#x27;Angelo</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Romano</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Giovannoni</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>A Functional Biological Network Centered on XRCC3: A New Possible Marker of Chemoradiotherapy Resistance in Rectal Cancer Patients</article-title>. <source>Cancer Biol. Ther.</source> <volume>16</volume>, <fpage>1160</fpage>&#x2013;<lpage>1171</lpage>. <pub-id pub-id-type="doi">10.1080/15384047.2015.1046652</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baliakas</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Agathangelidis</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hadzidimitriou</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sutton</surname>
<given-names>L.-A.</given-names>
</name>
<name>
<surname>Minga</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Tsanousa</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Not all IGHV3-21 Chronic Lymphocytic Leukemias Are Equal: Prognostic Considerations</article-title>. <source>Blood</source> <volume>125</volume>, <fpage>856</fpage>&#x2013;<lpage>859</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2014-09-600874</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bindea</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Mlecnik</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Tosolini</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kirilovsky</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Waldner</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Obenauf</surname>
<given-names>A. C.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Spatiotemporal Dynamics of Intratumoral Immune Cells Reveal the Immune Landscape in Human Cancer</article-title>. <source>Immunity</source> <volume>39</volume>, <fpage>782</fpage>&#x2013;<lpage>795</lpage>. <pub-id pub-id-type="doi">10.1016/j.immuni.2013.10.003</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bradley</surname>
<given-names>A. P.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>The Use of the Area under the ROC Curve in the Evaluation of Machine Learning Algorithms</article-title>. <source>Pattern Recognition</source> <volume>30</volume>, <fpage>1145</fpage>&#x2013;<lpage>1159</lpage>. <pub-id pub-id-type="doi">10.1016/s0031-3203(96)00142-2</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bray</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ferlay</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Soerjomataram</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Siegel</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>Torre</surname>
<given-names>L. A.</given-names>
</name>
<name>
<surname>Jemal</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Global Cancer Statistics 2018: GLOBOCAN Estimates of Incidence and Mortality Worldwide for 36 Cancers in 185 Countries</article-title>. <source>CA: A Cancer J.&#x20;Clinicians</source> <volume>68</volume>, <fpage>394</fpage>&#x2013;<lpage>424</lpage>. <pub-id pub-id-type="doi">10.3322/caac.21492</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Random Forests</article-title>. <source>Mach. Learn.</source> <volume>45</volume>, <fpage>5</fpage>&#x2013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1023/a:1010933404324</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ying</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>A Transfer Learning Based Super-resolution Microscopy for Biopsy Slice Images: The Joint Methods Perspective</article-title>. <source>Ieee/acm Trans. Comput. Biol. Bioinf.</source> <volume>18</volume>, <fpage>1</fpage>. <pub-id pub-id-type="doi">10.1109/TCBB.2020.2991173</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Geng</surname>
<given-names>J.-G.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>P-selectin Mediates Adhesion of Leukocytes, Platelets, and Cancer Cells in Inflammation, Thrombosis, and Cancer Growth and Metastasis</article-title>. <source>Arch. Immunol. Ther. Exp.</source> <volume>54</volume>, <fpage>75</fpage>&#x2013;<lpage>84</lpage>. <pub-id pub-id-type="doi">10.1007/s00005-006-0010-6</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Yuan</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Discriminative Cervical Lesion Detection in Colposcopic Images with Global Class Activation and Local Bin Excitation</article-title>. <source>IEEE J.&#x20;Biomed. Health Inform.</source> [<comment>in press</comment>]. <pub-id pub-id-type="doi">10.1109/JBHI.2021.3100367</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chevalier</surname>
<given-names>M. F.</given-names>
</name>
<name>
<surname>Trabanelli</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Racle</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Salom&#xe9;</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Cesson</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Gharbi</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>ILC2-modulated T&#x20;Cell-To-MDSC Balance Is Associated with Bladder Cancer Recurrence</article-title>. <source>J.&#x20;Clin. Invest.</source> <volume>127</volume>, <fpage>2916</fpage>&#x2013;<lpage>2929</lpage>. <pub-id pub-id-type="doi">10.1172/JCI89717</pub-id> </citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>D&#xed;az-Uriarte</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>de Andr&#xe9;s</surname>
<given-names>S. A.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Gene Selection and Classification of Microarray Data Using Random forest</article-title>. <source>BMC Bioinformatics</source> <volume>7</volume>, <fpage>3</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-7-3</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feng</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>D. Z.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>A Deep Learning Approach for Colonoscopy Pathology WSI Analysis: Accurate Segmentation and Classification</article-title>. <source>IEEE J.&#x20;Biomed. Health Inform.</source> <volume>25</volume>, <fpage>3700</fpage>&#x2013;<lpage>3708</lpage>. <pub-id pub-id-type="doi">10.1109/JBHI.2020.3040269</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fridman</surname>
<given-names>W. H.</given-names>
</name>
<name>
<surname>Pag&#xe8;s</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Saut&#xe8;s-Fridman</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Galon</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>The Immune Contexture in Human Tumours: Impact on Clinical Outcome</article-title>. <source>Nat. Rev. Cancer</source> <volume>12</volume>, <fpage>298</fpage>&#x2013;<lpage>306</lpage>. <pub-id pub-id-type="doi">10.1038/nrc3245</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Galon</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Mlecnik</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Bindea</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Angell</surname>
<given-names>H. K.</given-names>
</name>
<name>
<surname>Berger</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lagorce</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Towards the Introduction of the &#x27;Immunoscore&#x27; in the Classification of Malignant Tumours</article-title>. <source>J.&#x20;Pathol.</source> <volume>232</volume>, <fpage>199</fpage>&#x2013;<lpage>209</lpage>. <pub-id pub-id-type="doi">10.1002/path.4287</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guy</surname>
<given-names>T. V.</given-names>
</name>
<name>
<surname>Terry</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Bolton</surname>
<given-names>H. A.</given-names>
</name>
<name>
<surname>Hancock</surname>
<given-names>D. G.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Brink</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Collaboration between Tumor-specific CD4&#x2b; T&#x20;Cells and B&#x20;Cells in Anti-cancer Immunity</article-title>. <source>Oncotarget</source> <volume>7</volume>, <fpage>30211</fpage>&#x2013;<lpage>30229</lpage>. <pub-id pub-id-type="doi">10.18632/oncotarget.8797</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ho</surname>
<given-names>M.-C.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>J.-J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>C.-N.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>C.-C.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>C.-Y.</given-names>
</name>
<etal/>
</person-group> (<year>2006</year>). <article-title>A Gene Expression Profile for Vascular Invasion Can Predict the Recurrence after Resection of Hepatocellular Carcinoma: A Microarray Approach</article-title>. <source>Ann. Surg. Oncol.</source> <volume>13</volume>, <fpage>1474</fpage>&#x2013;<lpage>1484</lpage>. <pub-id pub-id-type="doi">10.1245/s10434-006-9057-1</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hoshida</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Villanueva</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Kobayashi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Peix</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chiang</surname>
<given-names>D. Y.</given-names>
</name>
<name>
<surname>Camargo</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2008</year>). <article-title>Gene Expression in Fixed Tissues and Outcome in Hepatocellular Carcinoma</article-title>. <source>N. Engl. J.&#x20;Med.</source> <volume>359</volume>, <fpage>1995</fpage>&#x2013;<lpage>2004</lpage>. <pub-id pub-id-type="doi">10.1056/NEJMoa0804525</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hsiao</surname>
<given-names>T.-F.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>C.-L.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Y.-C.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>H.-P.</given-names>
</name>
<name>
<surname>Chiu</surname>
<given-names>Y.-C.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>H.-Y.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Integrative Omics Analysis Reveals Soluble Cadherin-3 as a Survival Predictor and an Early Monitoring Marker of EGFR Tyrosine Kinase Inhibitor Therapy in Lung Cancer</article-title>. <source>Clin. Cancer Res.</source> <volume>26</volume>&#x2013;<lpage>3229</lpage>. <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-19-3972</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>A Clinical-Radiomics Nomogram for the Preoperative Prediction of Lung Metastasis in Colorectal Cancer Patients with Indeterminate Pulmonary Nodules</article-title>. <source>Eur. Radiol.</source> <volume>29</volume>, <fpage>439</fpage>&#x2013;<lpage>449</lpage>. <pub-id pub-id-type="doi">10.1007/s00330-018-5539-3</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hui</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Tumor Microenvironment: Sanctuary of the Devil</article-title>. <source>Cancer Lett.</source> <volume>368</volume>, <fpage>7</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1016/j.canlet.2015.07.039</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Iizuka</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Oka</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Yamada-Okabe</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Nishida</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Maeda</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Mori</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2003</year>). <article-title>Oligonucleotide Microarray for Prediction of Early Intrahepatic Recurrence of Hepatocellular Carcinoma after Curative Resection</article-title>. <source>The Lancet</source> <volume>361</volume>, <fpage>923</fpage>&#x2013;<lpage>929</lpage>. <pub-id pub-id-type="doi">10.1016/S0140-6736(03)12775-4</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Katz</surname>
<given-names>M. H.</given-names>
</name>
<name>
<surname>Hauck</surname>
<given-names>W. W.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>Proportional Hazards (Cox) Regression</article-title>. <source>J.&#x20;Gen. Intern. Med.</source> <volume>8</volume>, <fpage>702</fpage>&#x2013;<lpage>711</lpage>. <pub-id pub-id-type="doi">10.1007/bf02598295</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>Y. J.</given-names>
</name>
<name>
<surname>Borsig</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Varki</surname>
<given-names>N. M.</given-names>
</name>
<name>
<surname>Varki</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>P-selectin Deficiency Attenuates Tumor Growth and Metastasis</article-title>. <source>Pnas</source> <volume>95</volume>, <fpage>9325</fpage>&#x2013;<lpage>9330</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.95.16.9325</pub-id> </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kudo</surname>
<given-names>S.-e.</given-names>
</name>
<name>
<surname>Ichimasa</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Villard</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Mori</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Misawa</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Saito</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Artificial Intelligence System to Determine Risk of T1 Colorectal Cancer Metastasis to Lymph Node</article-title>. <source>Gastroenterology</source> <volume>160</volume>, <fpage>1075</fpage>&#x2013;<lpage>1084</lpage>. <pub-id pub-id-type="doi">10.1053/j.gastro.2020.09.027</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Le</surname>
<given-names>N. Q. K.</given-names>
</name>
<name>
<surname>Do</surname>
<given-names>D. T.</given-names>
</name>
<name>
<surname>Hung</surname>
<given-names>T. N. K.</given-names>
</name>
<name>
<surname>Lam</surname>
<given-names>L. H. T.</given-names>
</name>
<name>
<surname>Huynh</surname>
<given-names>T.-T.</given-names>
</name>
<name>
<surname>Nguyen</surname>
<given-names>N. T. K.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A Computational Framework Based on Ensemble Deep Neural Networks for Essential Genes Identification</article-title>. <source>Ijms</source> <volume>21</volume>, <fpage>9070</fpage>. <pub-id pub-id-type="doi">10.3390/ijms21239070</pub-id> </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Le</surname>
<given-names>N. Q. K.</given-names>
</name>
<name>
<surname>Hung</surname>
<given-names>T. N. K.</given-names>
</name>
<name>
<surname>Do</surname>
<given-names>D. T.</given-names>
</name>
<name>
<surname>Lam</surname>
<given-names>L. H. T.</given-names>
</name>
<name>
<surname>Dang</surname>
<given-names>L. H.</given-names>
</name>
<name>
<surname>Huynh</surname>
<given-names>T.-T.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Radiomics-based Machine Learning Model for Efficiently Classifying Transcriptome Subtypes in Glioblastoma Patients from MRI</article-title>. <source>Comput. Biol. Med.</source> <volume>132</volume>, <fpage>104320</fpage>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2021.104320</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>J.-S.</given-names>
</name>
<name>
<surname>Heo</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Libbrecht</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Chu</surname>
<given-names>I.-S.</given-names>
</name>
<name>
<surname>Kaposi-Novak</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Calvisi</surname>
<given-names>D. F.</given-names>
</name>
<etal/>
</person-group> (<year>2006</year>). <article-title>A Novel Prognostic Subtype of Human Hepatocellular Carcinoma Derived from Hepatic Progenitor Cells</article-title>. <source>Nat. Med.</source> <volume>12</volume>, <fpage>410</fpage>&#x2013;<lpage>416</lpage>. <pub-id pub-id-type="doi">10.1038/nm1377</pub-id> </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Molecular Characterization of the CD79a and CD79b and its Role against Aeromonas Hydrophila Infection in Chinese Sucker (<italic>Myxocyprinus asiaticus</italic>)</article-title>. <source>Fish. Physiol. Biochem.</source> <volume>43</volume>, <fpage>1571</fpage>&#x2013;<lpage>1585</lpage>. <pub-id pub-id-type="doi">10.1007/s10695-017-0394-8</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Dou</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>KLF4-Mediated CDH3 Upregulation Suppresses Human Hepatoma Cell Growth and Migration via GSK-3&#x3b2; Signaling</article-title>. <source>Int. J.&#x20;Biol. Sci.</source> <volume>15</volume>, <fpage>953</fpage>&#x2013;<lpage>961</lpage>. <pub-id pub-id-type="doi">10.7150/ijbs.30857</pub-id> </citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Pang</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Joint Multiple Fully Connected Convolutional Neural Network with Extreme Learning Machine for Hepatocellular Carcinoma Nuclei Grading</article-title>. <source>Comput. Biol. Med.</source> <volume>84</volume>, <fpage>156</fpage>&#x2013;<lpage>167</lpage>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2017.03.017</pub-id> </citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liang</surname>
<given-names>J.-D.</given-names>
</name>
<name>
<surname>Ping</surname>
<given-names>X.-O.</given-names>
</name>
<name>
<surname>Tseng</surname>
<given-names>Y.-J.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>G.-T.</given-names>
</name>
<name>
<surname>Lai</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>P.-M.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Recurrence Predictive Models for Patients with Hepatocellular Carcinoma after Radiofrequency Ablation Using Support Vector Machines with Feature Selection Methods</article-title>. <source>Comp. Methods Programs Biomed.</source> <volume>117</volume>, <fpage>425</fpage>&#x2013;<lpage>434</lpage>. <pub-id pub-id-type="doi">10.1016/j.cmpb.2014.09.001</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mesci</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Taeb</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jahangiri</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Fokas</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Targeting of CCBE1 by miR-330-3p in Human Breast Cancer Promotes Metastasis</article-title>. <source>Br. J.&#x20;Cancer</source> <volume>116</volume>, <fpage>1350</fpage>&#x2013;<lpage>1357</lpage>. <pub-id pub-id-type="doi">10.1038/bjc.2017.105</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nakayama</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Takayama</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Role of Surgical Resection for Hepatocellular Carcinoma Based on Japanese Clinical Guidelines for Hepatocellular Carcinoma</article-title>. <source>Wjh</source> <volume>7</volume>, <fpage>261</fpage>&#x2013;<lpage>269</lpage>. <pub-id pub-id-type="doi">10.4254/wjh.v7.i2.261</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ness</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Katta</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Garred</surname>
<given-names>&#xd8;.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Olstad</surname>
<given-names>O. K.</given-names>
</name>
<name>
<surname>Petrovski</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Integrated Differential DNA Methylation and Gene Expression of Formalin-Fixed Paraffin-Embedded Uveal Melanoma Specimens Identifies Genes Associated with Early Metastasis and Poor Prognosis</article-title>. <source>Exp. Eye Res.</source> <volume>203</volume>, <fpage>108426</fpage>. <pub-id pub-id-type="doi">10.1016/j.exer.2020.108426</pub-id> </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nick</surname>
<given-names>T. G.</given-names>
</name>
<name>
<surname>Campbell</surname>
<given-names>K. M.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Logistic Regression</article-title>. <source>Methods Mol. Biol.</source> <volume>404</volume>, <fpage>273</fpage>&#x2013;<lpage>301</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-59745-530-5_14</pub-id> </citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ntzani</surname>
<given-names>E. E.</given-names>
</name>
<name>
<surname>Ioannidis</surname>
<given-names>J.&#x20;P.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Predictive Ability of DNA Microarrays for Cancer Outcomes and Correlates: An Empirical Assessment</article-title>. <source>The Lancet</source> <volume>362</volume>, <fpage>1439</fpage>&#x2013;<lpage>1444</lpage>. <pub-id pub-id-type="doi">10.1016/S0140-6736(03)14686-7</pub-id> </citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Olkhanud</surname>
<given-names>P. B.</given-names>
</name>
<name>
<surname>Damdinsuren</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Bodogai</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gress</surname>
<given-names>R. E.</given-names>
</name>
<name>
<surname>Sen</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Wejksza</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Tumor-Evoked Regulatory B&#x20;Cells Promote Breast Cancer Metastasis by Converting Resting CD4&#x2b; T&#x20;Cells to T-Regulatory Cells</article-title>. <source>Cancer Res.</source> <volume>71</volume>, <fpage>3505</fpage>&#x2013;<lpage>3515</lpage>. <pub-id pub-id-type="doi">10.1158/0008-5472.CAN-10-4316</pub-id> </citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ou</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Yeh</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Qi</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Tumor Microenvironment B&#x20;Cells Increase Bladder Cancer Metastasisviamodulation of the IL-8/androgen Receptor (AR)/MMPs Signals</article-title>. <source>Oncotarget</source> <volume>6</volume>, <fpage>26065</fpage>&#x2013;<lpage>26078</lpage>. <pub-id pub-id-type="doi">10.18632/oncotarget.4569</pub-id> </citation>
</ref>
<ref id="B39">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Reif</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Motsinger</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>McKinney</surname>
<given-names>B. A.</given-names>
</name>
<name>
<surname>Crowe</surname>
<given-names>J.&#x20;E.</given-names>
</name>
<name>
<surname>Moore</surname>
<given-names>J.&#x20;H.</given-names>
</name>
</person-group> (<year>2006</year>). &#x201c;<article-title>Feature Selection Using a Random Forests Classifier for the Integrated Analysis of Multiple Data Types</article-title>,&#x201d; in <conf-name>IEEE Symposium on Computational Intelligence and Bioinformatics and Computational Biology</conf-name>, <conf-loc>Toronto, ON, Canada</conf-loc>, <conf-date>September 28-29, 2006</conf-date>, <fpage>1</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1109/CIBCB.2006.330987</pub-id> </citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sanchez-pinto</surname>
<given-names>L. N.</given-names>
</name>
<name>
<surname>Venable</surname>
<given-names>L. R.</given-names>
</name>
<name>
<surname>Fahrenbach</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Churpek</surname>
<given-names>M. M.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Comparison of Variable Selection Methods for Clinical Predictive Modeling</article-title>. <source>Int. J.&#x20;Med. Inform.</source> <volume>116</volume>, <fpage>10</fpage>&#x2013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2018.05.006</pub-id> </citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Somura</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Iizuka</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Tamesa</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Sakamoto</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Hamaguchi</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tsunedomi</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2008</year>). <article-title>A Three-Gene Predictor for Early Intrahepatic Recurrence of Hepatocellular Carcinoma after Curative Hepatectomy</article-title>. <source>Oncol. Rep.</source> <volume>19</volume>, <fpage>489</fpage>&#x2013;<lpage>495</lpage>. <pub-id pub-id-type="doi">10.3892/or.19.2.489</pub-id> </citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Song</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Cui</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>CCBE1 Promotes Tumor Lymphangiogenesis and Is Negatively Regulated by TGF&#x3b2; Signaling in Colorectal Cancer</article-title>. <source>Theranostics</source> <volume>10</volume>, <fpage>2327</fpage>&#x2013;<lpage>2341</lpage>. <pub-id pub-id-type="doi">10.7150/thno.39740</pub-id> </citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stamatopoulos</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Smith</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Crompot</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Pieters</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Clifford</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Mraz</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>The Light Chain IgLV3-21 Defines a New Poor Prognostic Subgroup in Chronic Lymphocytic Leukemia: Results of a Multicenter Study</article-title>. <source>Clin. Cancer Res.</source> <volume>24</volume>, <fpage>5048</fpage>&#x2013;<lpage>5057</lpage>. <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-18-0133</pub-id> </citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Hou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Single-cell Landscape of the Ecosystem in Early-Relapse Hepatocellular Carcinoma</article-title>. <source>Cell</source> <volume>184</volume>, <fpage>404</fpage>&#x2013;<lpage>421</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2020.11.041</pub-id> </citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Taniuchi</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Nakagawa</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hosokawa</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Nakamura</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Eguchi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Ohigashi</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2005</year>). <article-title>Overexpressed P-cadherin/CDH3 Promotes Motility of Pancreatic Cancer Cells by Interacting with P120ctn and Activating Rho-Family GTPases</article-title>. <source>Cancer Res.</source> <volume>65</volume>, <fpage>3092</fpage>&#x2013;<lpage>3099</lpage>. <pub-id pub-id-type="doi">10.1158/0008.5472.CAN-04-3646</pub-id> </citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tibshirani</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>Regression Shrinkage and Selection via the Lasso</article-title>. <source>J.&#x20;R. Stat. Soc. Ser. B (Methodological)</source> <volume>58</volume>, <fpage>267</fpage>&#x2013;<lpage>288</lpage>. <pub-id pub-id-type="doi">10.1111/j.2517-6161.1996.tb02080.x</pub-id> </citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>An Experimental Study of the Intrinsic Stability of Random forest Variable Importance Measures</article-title>. <source>BMC Bioinformatics</source> <volume>17</volume>, <fpage>60</fpage>. <pub-id pub-id-type="doi">10.1186/s12859-016-0900-5</pub-id> </citation>
</ref>
<ref id="B48">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wonka</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Ye</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2014</year>). &#x201c;<article-title>A Safe Screening Rule for Sparse Logistic Regression</article-title>,&#x201d; in <conf-name>Proceedings of the 27th International Conference on Neural Information Processing Systems</conf-name>, <conf-loc>Montreal, Canada</conf-loc>, <conf-date>December 8 - 13, 2014</conf-date>, <volume>2</volume>, <fpage>1053</fpage>&#x2013;<lpage>1061</lpage>. </citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Lv</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>A Five-Gene Signature for Recurrence Prediction of Hepatocellular Carcinoma Patients</article-title>. <source>Biomed. Res. Int.</source> <volume>2020</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1155/2020/4037639</pub-id> </citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Woo</surname>
<given-names>H. G.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>E. S.</given-names>
</name>
<name>
<surname>Cheon</surname>
<given-names>J.&#x20;H.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>J.&#x20;H.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>J.-S.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>B. J.</given-names>
</name>
<etal/>
</person-group> (<year>2008</year>). <article-title>Gene Expression-Based Recurrence Prediction of Hepatitis B Virus-Related Human Hepatocellular Carcinoma</article-title>. <source>Clin. Cancer Res.</source> <volume>14</volume>, <fpage>2056</fpage>&#x2013;<lpage>2064</lpage>. <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-07-1473</pub-id> </citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Dong</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>High Expression of CDH3 Predicts a Good Prognosis for colon Adenocarcinoma Patients</article-title>. <source>Exp. Ther. Med.</source> <volume>18</volume>, <fpage>841</fpage>&#x2013;<lpage>847</lpage>. <pub-id pub-id-type="doi">10.3892/etm.2019.7638</pub-id> </citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu-Monette</surname>
<given-names>Z. Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Xia</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Crossley</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Bremel</surname>
<given-names>R. D.</given-names>
</name>
<name>
<surname>Miao</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Immunoglobulin Somatic Hypermutation Has Clinical Impact in DLBCL and Potential Implications for Immune Checkpoint Blockade and Neoantigen-Based Immunotherapies</article-title>. <source>J.&#x20;Immunotherapy Cancer</source> <volume>7</volume>, <fpage>272</fpage>. <pub-id pub-id-type="doi">10.1186/s40425-019-0730-x</pub-id> </citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yoshihara</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Shahmoradgoli</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mart&#xed;nez</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Vegesna</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Torres-Garcia</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Inferring Tumour Purity and Stromal and Immune Cell Admixture from Expression Data</article-title>. <source>Nat. Commun.</source> <volume>4</volume>, <fpage>2612</fpage>. <pub-id pub-id-type="doi">10.1038/ncomms3612</pub-id> </citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Jia</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Lymph Node Metastasis Prediction of Papillary Thyroid Carcinoma Based on Transfer Learning Radiomics</article-title>. <source>Nat. Commun.</source> <volume>11</volume>, <fpage>965</fpage>&#x2013;<lpage>975</lpage>. <pub-id pub-id-type="doi">10.1038/s41467-020-18497-3</pub-id> </citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Gonzalez</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Brezski</surname>
<given-names>R. J.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Dysfunctional Antibodies in the Tumor Microenvironment Associate with Impaired Anticancer Immunity</article-title>. <source>Clin. Cancer Res.</source> <volume>21</volume>, <fpage>5380</fpage>&#x2013;<lpage>5390</lpage>. <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-15-1057</pub-id> </citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Sprengers</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Mancham</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Erkens</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Boor</surname>
<given-names>P. P. C.</given-names>
</name>
<name>
<surname>van Beek</surname>
<given-names>A. A.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Reduction of Immunosuppressive Tumor Microenvironment in Cholangiocarcinoma by <italic>Ex Vivo</italic> Targeting Immune Checkpoint Molecules</article-title>. <source>J.&#x20;Hepatol.</source> <volume>71</volume>, <fpage>753</fpage>&#x2013;<lpage>762</lpage>. <pub-id pub-id-type="doi">10.1016/j.jhep.2019.05.026</pub-id> </citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Z.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>NUDT21 Promotes Tumor Growth and Metastasis through Modulating SGPP2 in Human Gastric Cancer</article-title>. <source>Front. Oncol.</source> <volume>11</volume>, <fpage>670353</fpage>. <pub-id pub-id-type="doi">10.3389/fonc.2021.670353</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>