<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Oncol.</journal-id>
<journal-title>Frontiers in Oncology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Oncol.</abbrev-journal-title>
<issn pub-type="epub">2234-943X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fonc.2024.1401496</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Oncology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Construction of diagnostic models for the progression of hepatocellular carcinoma using machine learning</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Jiang</surname>
<given-names>Xin</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2684047"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Zhou</surname>
<given-names>Ruilong</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Jiang</surname>
<given-names>Fengle</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2618663"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yan</surname>
<given-names>Yanan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Zheting</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Wang</surname>
<given-names>Jianmin</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1595966"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Innovation Center for Cancer Research, Clinical Oncology School of Fujian Medical University, Fujian Cancer Hospital</institution>, <addr-line>Fuzhou</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Fujian Key Laboratory of Advanced Technology for Cancer Screening and Early Diagnosis</institution>, <addr-line>Fuzhou</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Faculty of Medicine, The Chinese University of Hong Kong</institution>, <addr-line>Hong Kong</addr-line>, <country>Hong Kong SAR, China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Francisco Tustumi, University of S&#xe3;o Paulo, Brazil</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Jonathan Soldera, University of Caxias do Sul, Brazil</p>
<p>Zeynep Kucukakcali, &#x130;n&#xf6;n&#xfc; University, T&#xfc;rkiye</p>
<p>William Matsui, The University of Texas at Austin, United States</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Jianmin Wang, <email xlink:href="mailto:wangjm8605@163.com">wangjm8605@163.com</email>
</p>
</fn>
<fn fn-type="equal" id="fn003">
<p>&#x2020;These authors have contributed equally to this work</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>15</day>
<month>05</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>14</volume>
<elocation-id>1401496</elocation-id>
<history>
<date date-type="received">
<day>15</day>
<month>03</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>29</day>
<month>04</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Jiang, Zhou, Jiang, Yan, Zhang and Wang</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Jiang, Zhou, Jiang, Yan, Zhang and Wang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Liver cancer is one of the most prevalent forms of cancer worldwide. A significant proportion of patients with hepatocellular carcinoma (HCC) are diagnosed at advanced stages, leading to unfavorable treatment outcomes. Generally, the development of HCC occurs in distinct stages. However, the diagnostic and intervention markers for each stage remain unclear. Therefore, there is an urgent need to explore precise grading methods for HCC. Machine learning has emerged as an effective technique for studying precise tumor diagnosis. In this research, we employed random forest and LightGBM machine learning algorithms for the first time to construct diagnostic models for HCC at various stages of progression. We categorized 118 samples from GSE114564 into three groups: normal liver, precancerous lesion (including chronic hepatitis, liver cirrhosis, dysplastic nodule), and HCC (including early stage HCC and advanced HCC). The LightGBM model exhibited outstanding performance (accuracy = 0.96, precision = 0.96, recall = 0.96, F1-score = 0.95). Similarly, the random forest model also demonstrated good performance (accuracy = 0.83, precision = 0.83, recall = 0.83, F1-score = 0.83). When the progression of HCC was categorized into the most refined six stages: normal liver, chronic hepatitis, liver cirrhosis, dysplastic nodule, early stage HCC, and advanced HCC, the diagnostic model still exhibited high efficacy. Among them, the LightGBM model exhibited good performance (accuracy = 0.71, precision = 0.71, recall = 0.71, F1-score = 0.72). Also, performance of the LightGBM model was superior to that of the random forest model. Overall, we have constructed a diagnostic model for the progression of HCC and identified potential diagnostic characteristic gene for the progression of HCC.</p>
</abstract>
<kwd-group>
<kwd>liver cancer</kwd>
<kwd>machine learning</kwd>
<kwd>random forest model</kwd>
<kwd>LightGBM model</kwd>
<kwd>the progression of HCC</kwd>
</kwd-group>
<counts>
<fig-count count="10"/>
<table-count count="6"/>
<equation-count count="0"/>
<ref-count count="43"/>
<page-count count="11"/>
<word-count count="3548"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Gastrointestinal Cancers: Hepato Pancreatic Biliary Cancers</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>According to the recent data on global cancer burden in 2020, liver cancer ranked as the sixth most common cancer in terms of incidence rate and the third highest in terms of mortality (<xref ref-type="bibr" rid="B1">1</xref>). A considerable percentage of patients diagnosed with hepatocellular carcinoma (HCC) are at an advanced stage. Therefore, the identification of diagnostic markers is of immense importance (<xref ref-type="bibr" rid="B2">2</xref>&#x2013;<xref ref-type="bibr" rid="B4">4</xref>). The development of HCC is a gradual process. Patients with chronic liver disease experience persistent liver inflammation, fibrosis, and abnormal regeneration of liver cells. These abnormalities can lead to cirrhosis and gradually give rise to dysplastic nodules of precancerous lesions. Finally, the patients will develop HCC (<xref ref-type="bibr" rid="B5">5</xref>). However, the marker gene for HCC progression remain unclear.</p>
<p>Thus, there is an urgent need to identify markers and develop precise diagnostic model for progression of HCC. With the development of artificial intelligence, machine learning has shown promise in cancer diagnosis and treatment (<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B7">7</xref>). For example, Zhang (<xref ref-type="bibr" rid="B8">8</xref>) developed a machine learning-based model for the early detection of liver cancer by utilizing low-depth whole genome sequencing of cell-free DNA. The model achieved an AUC of 0.995, a sensitivity of 0.968, and a specificity of 0.988 in differentiating between liver cancer and non-liver cancer. According to feature selection, Tang (<xref ref-type="bibr" rid="B9">9</xref>) used Least Absolute Shrinkage and Selector Operation (Lasso), Support Vector Machine (SVM), and Random Forest (RF) to construct HCC classification models for HCC saliva samples. The diagnostic accuracy of the LASSO-HCC model was 0.706, the diagnostic accuracy of the SVM-HCC model was 0.812, and the diagnostic accuracy of the RF-HCC model was 0.859.</p>
<p>However, these studies exclusively focused on particular stages in the progression of HCC. In this research, we aim to develop an accurate diagnostic model for the progression of HCC by utilizing machine learning algorithms, such as RF and LightGBM. The RF and LightGBM models are two commonly used machine learning algorithms known for their strong performance and effectiveness in dealing with classification and regression problems.</p>
<p>RF is an ensemble learning algorithm that enhances prediction accuracy by constructing multiple decision trees and taking the average of the predictions from these trees. RF can reduce overfitting, is tolerant to missing values, and can assess the importance of each feature, aiding in data comprehension (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B11">11</xref>). LightGBM is a distributed and high-performance algorithm designed for gradient-boosting decision trees, specifically based on the Histogram algorithm, characterized by efficiency, speed, and high accuracy. Principle of LightGBM is to iteratively train multiple decision trees and train the next tree based on the results of the previous tree to minimize the loss function (<xref ref-type="bibr" rid="B12">12</xref>, <xref ref-type="bibr" rid="B13">13</xref>). Combining the RF and LightGBM models can yield more comprehensive and accurate results in research. These two algorithms have outstanding performance in cancer diagnostics (<xref ref-type="bibr" rid="B14">14</xref>).</p>
<p>In this research, we classified 118 samples from GSE114564 into three groups: normal liver, precancerous lesion, and HCC. The RF model and LightGBM model showed strong performance and identified 12 characteristic genes. Additionally, the diagnostic model still exhibited high efficacy when categorizing the progression of HCC into six finely stratified stages. To the best of our knowledge, this research represented the first application of machine learning to comprehensively cover all stages of HCC progression.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<title>Materials and methods</title>
<sec id="s2_1">
<title>Patients</title>
<p>This research employed the RNA-sequencing dataset GSE114564 (<xref ref-type="bibr" rid="B15">15</xref>), retrieved from the GEO database, which included transcriptome data from 118 tissue samples representing different stages of HCC. The dataset included 15 normal liver samples, 20 chronic hepatitis samples, 10 liver cirrhosis samples, 10 dysplastic nodule samples, 18 early stage HCC samples, and 45 advanced HCC samples. This comprehensive dataset covers almost all stages for progression of HCC.</p>
</sec>
<sec id="s2_2">
<title>Data processing</title>
<p>We obtained the file &#x201c;GSE114564_Liver_Cancer_FPKM.txt.gz&#x201d; from the GEO database (<ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE114564">https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE114564</ext-link>). FPKM (fragments per kilobase of exon model per million mapped fragments) of 118 samples were used as the input file, which can effectively eliminate the impact of sequencing depth and gene length on the results. Following that, we conducted an 8:2 random split (<xref ref-type="bibr" rid="B16">16</xref>&#x2013;<xref ref-type="bibr" rid="B18">18</xref>) to partition the 118 available samples into training and validation sets. The 8:2 ratio is commonly regarded as a reasonable choice, because it ensures an adequate sample size for the training set, while also providing a certain number of samples for the validation set to evaluate model performance. Next, we kept genes that are expressed (FPKM&gt;0) in at least three samples and these genes are in scanpy (<xref ref-type="bibr" rid="B19">19</xref>) (scanpy.pp.filter_genes). Then, the data matrix is log-transformed (scanpy.pp.log1p). In the end, we selected the top 1000 genes (<xref ref-type="bibr" rid="B20">20</xref>&#x2013;<xref ref-type="bibr" rid="B22">22</xref>) by the ranking variances of all samples (scanpy.pp.highly_variable_genes), which was performed variance calculation in Scanpy. More specifically, a normalized variance for each gene is computed. First, the data are standardized (i.e., <italic>z</italic>-score normalization per feature) with a regularized standard deviation. Next, the normalized variance is computed as the variance of each gene after the transformation. Genes are ranked by the normalized variance. Finally, we selected the top 1,000 genes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref>) that demonstrated the highest overall variance in FPKM as the foundation for constructing RF and LightGBM models. The variance calculation and above data processing steps were all implemented in scanpy.</p>
</sec>
<sec id="s2_3">
<title>Construction of machine learning</title>
<p>Subsequently, we employed the Python framework sklearn (<xref ref-type="bibr" rid="B23">23</xref>) to construct the RF model using the RF program (sklearn.ensemble.RandomForestClassifier) and LightGBM program (Lightgbm.sklearn), with all parameters set to default values. The framework sklearn available online is: <ext-link ext-link-type="uri" xlink:href="https://scikit-learn.org/stable/supervised_learning.html">https://scikit-learn.org/stable/supervised_learning.html</ext-link>. Cross-validation was used in this study to find the optimal parameters of the classification model and help the model alleviate overfitting. This study uses fivefold cross-validation on the training dataset, and uses accuracy, precision, recall, and F1-score to evaluate the model performance, and the results are in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S2</bold>
</xref>.</p>
</sec>
<sec id="s2_4">
<title>Analysis of characteristic gene</title>
<p>The RF and LightGBM models calculated the gene importance and identified the top 50 most important genes (<xref ref-type="bibr" rid="B24">24</xref>), separately (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S3</bold>
</xref>). Furthermore, the intersection of these 50 genes was taken to obtain the feature genes. Upon constructing the aforementioned model, we obtained a set of characteristic genes. Following that, we generated expression heatmap using TBtools HeatMap illustrator program. TBtools is an integrative toolkit developed for interactive analyses of big biological data (<xref ref-type="bibr" rid="B25">25</xref>, <xref ref-type="bibr" rid="B26">26</xref>). Survival analysis was performed using the GEPIA2 database, and GO pathway enrichment was performed using clusterProfiler R package (<xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B28">28</xref>). Finally, we used the GeneCards database (<xref ref-type="bibr" rid="B29">29</xref>) to identify characteristic genes associated with occurrence of HCC (<ext-link ext-link-type="uri" xlink:href="https://www.genecards.org/">https://www.genecards.org/</ext-link>). The workflow diagram for this research was depicted in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Workflow diagram in this research.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1401496-g001.tif"/>
</fig>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Result</title>
<sec id="s3_1">
<title>Constructing machine learning model based three distinct groups</title>
<p>Based on the transformative process of HCC, the data can be categorized into three groups: normal liver, precancerous lesion (including chronic hepatitis, liver cirrhosis, dysplastic nodule), and HCC (including early stage HCC and advanced HCC). We employed the RF and LightGBM algorithms of machine learning to develop a diagnostic model for the progression of HCC. Performance measure of the RF model was presented in <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref> and <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>, indicating an accuracy of 0.83, precision of 0.83, recall of 0.83, and F1-score of 0.83. Similarly, performance measure of the LightGBM model indicated an accuracy of 0.96, precision of 0.96, recall of 0.96, and F1-score of 0.95.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Confusion matrix of the models. <bold>(A)</bold> Confusion matrix of the random forest model. <bold>(B)</bold> Confusion matrix of the LightGBM model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1401496-g002.tif"/>
</fig>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Performance measure of machine learning models based three distinct groups.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">Model</th>
<th valign="top" align="left">Accuracy</th>
<th valign="top" align="left">Precision</th>
<th valign="top" align="left">Recall</th>
<th valign="top" align="left">F1-score</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Random forest</td>
<td valign="top" align="left">0.83</td>
<td valign="top" align="left">0.83</td>
<td valign="top" align="left">0.83</td>
<td valign="top" align="left">0.83</td>
</tr>
<tr>
<td valign="top" align="left">LightGBM</td>
<td valign="top" align="left">0.96</td>
<td valign="top" align="left">0.96</td>
<td valign="top" align="left">0.96</td>
<td valign="top" align="left">0.95</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>According to the method, the models above comprised a total of 12 characteristic genes (<italic>CLEC3B</italic>, <italic>RN7SL5P</italic>, <italic>RP11&#x2013;977G19.10</italic>, <italic>ASPDH</italic>, <italic>CFP</italic>, <italic>CDC37L1-AS1</italic>, <italic>RN7SL752P</italic>, <italic>U3</italic>, <italic>IGFALS</italic>, <italic>MASP2</italic>, <italic>RN7SKP255</italic>, <italic>RP11&#x2013;162P23.2</italic>). Next, we utilized TBtools to generate expression heatmap for these 12 characteristic genes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S1</bold>
</xref>). The characteristic genes are primarily involved in complement activation, activation of immune response, cytoplasmic vesicle lumen, complement binding, oxidoreductase activity, and other pathways (<italic>q</italic> &lt; 0.05; <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>).</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Go pathway enrichment of characteristic genes.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1401496-g003.tif"/>
</fig>
<p>Among these genes, we found that poor prognosis was associated with low expression of <italic>CLEC3B</italic>, <italic>CDC37L1-AS1</italic>, <italic>IGFALS</italic>, and <italic>MASP2</italic> (Logrank <italic>p</italic> &lt; 0.05; <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>). Moreover, both <italic>CLEC3B</italic> and <italic>IGFALS</italic> showed a strong association with the occurrence of HCC (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>) (<xref ref-type="bibr" rid="B30">30</xref>, <xref ref-type="bibr" rid="B31">31</xref>).</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Overall survival of HCC genes in GEPIA2 database. <bold>(A)</bold> Overall survival of <italic>CLEC3B.</italic> <bold>(B)</bold> Overall survival of <italic>CDC37L1-AS1.</italic> <bold>(C)</bold> Overall survival of <italic>IGFALS.</italic> <bold>(D)</bold> Overall survival of <italic>MASP2</italic>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1401496-g004.tif"/>
</fig>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>
<italic>CLEC3B</italic> and <italic>IGFALS</italic> reported in HCC from GeneCards database.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">GeneName</th>
<th valign="top" align="left">Location</th>
<th valign="top" align="left">Function summaries</th>
<th valign="top" align="left">Related pathways</th>
<th valign="top" align="left">Report</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">
<italic>CLEC3B</italic>
</td>
<td valign="top" align="left">3p21.31</td>
<td valign="top" align="left">May be involved in the packaging of molecules destined for exocytosis.</td>
<td valign="top" align="left">Platelet activation, signaling and aggregation.</td>
<td valign="top" align="left">(<xref ref-type="bibr" rid="B30">30</xref>)</td>
</tr>
<tr>
<td valign="top" align="left">
<italic>IGFALS</italic>
</td>
<td valign="top" align="left">16p13.3</td>
<td valign="top" align="left">Encoded by this gene is a serum protein that binds insulin-like growth factors, increasing their half-life and the vascular localization.</td>
<td valign="top" align="left">1.Regulation of Insulin-like Growth Factor.<break/>2.Inulin-like growth factor binding.</td>
<td valign="top" align="left">(<xref ref-type="bibr" rid="B31">31</xref>)</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3_2">
<title>Constructing machine learning model based four distinct groups</title>
<p>In order to further investigate the effectiveness of machine learning models in classifying early stage HCC, we categorized the data into four groups: normal liver, precancerous lesion (including chronic hepatitis, liver cirrhosis, dysplastic nodule), early stage HCC, and advanced HCC. Performance measure of the random forest model was presented in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>, <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>, indicating an accuracy of 0.83, precision of 0.83, recall of 0.83, and F1-score of 0.83. Similarly, performance measure of the LightGBM model indicated an accuracy of 0.75, precision of 0.75, recall of 0.75, and F1-score of 0.76.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Confusion matrix of the models. <bold>(A)</bold> Confusion matrix of the random forest model. <bold>(B)</bold> Confusion matrix of the LightGBM model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1401496-g005.tif"/>
</fig>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Performance measure of machine learning models based four distinct groups.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">Model</th>
<th valign="top" align="left">Accuracy</th>
<th valign="top" align="left">Precision</th>
<th valign="top" align="left">Recall</th>
<th valign="top" align="left">F1-score</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Random forest</td>
<td valign="top" align="left">0.83</td>
<td valign="top" align="left">0.83</td>
<td valign="top" align="left">0.83</td>
<td valign="top" align="left">0.83</td>
</tr>
<tr>
<td valign="top" align="left">LightGBM</td>
<td valign="top" align="left">0.75</td>
<td valign="top" align="left">0.75</td>
<td valign="top" align="left">0.75</td>
<td valign="top" align="left">0.76</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>According to the method, the models above comprised a total of 12 characteristic genes (<italic>HBA2</italic>, <italic>RP11&#x2013;977G19.10</italic>, <italic>AC004538.3</italic>, <italic>INS-IGF2</italic>, <italic>RNU2&#x2013;63P</italic>, <italic>RN7SL752P</italic>, <italic>U3</italic>, <italic>VIPR1</italic>, <italic>MASP2</italic>, <italic>TDO2</italic>, <italic>RN7SKP255</italic>, <italic>RP11&#x2013;162P23.2</italic>). Furthermore, we utilized TBtools to generate expression heatmap for these 12 characteristic genes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S2</bold>
</xref>). The characteristic genes are primarily enriched in pathways associated with the tryptophan metabolic process, hemoglobin complex, oxygen binding, and other pathways (<italic>q</italic> &lt; 0.05; <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>).</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>GO pathway enrichment of characteristic genes.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1401496-g006.tif"/>
</fig>
<p>Regarding these genes, low expression of <italic>AC004538.3</italic>, <italic>VIPR1</italic>, and <italic>MASP2</italic> was associated with a poor prognosis (Logrank <italic>p</italic> &lt; 0.05; <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref>). Furthermore, <italic>VIPR1</italic> exhibited a strong association with the occurrence of HCC (<xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref>) (<xref ref-type="bibr" rid="B32">32</xref>).</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Overall survival of HCC genes in GEPIA2 database. <bold>(A)</bold> Overall survival of <italic>AC004538.3</italic>. <bold>(B)</bold> Overall survival of <italic>VIPR1</italic>. <bold>(C)</bold> Overall survival of <italic>MASP2.</italic>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1401496-g007.tif"/>
</fig>
<table-wrap id="T4" position="float">
<label>Table&#xa0;4</label>
<caption>
<p>
<italic>VIPR1</italic> reported in HCC from GeneCards database.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">GeneName</th>
<th valign="top" align="left">Location</th>
<th valign="top" align="left">Function summaries</th>
<th valign="top" align="left">Related pathways</th>
<th valign="top" align="left">Report</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">
<italic>VIPR1</italic>
</td>
<td valign="top" align="left">3p22.1</td>
<td valign="top" align="left">This is a receptor for VIP. The activity of this receptor is mediated by G proteins which activate adenylyl cyclase.</td>
<td valign="top" align="left">1.Glucocorticoid receptor regulatory network.<break/>2.GPCR downstream signal.</td>
<td valign="top" align="left">(<xref ref-type="bibr" rid="B32">32</xref>)</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3_3">
<title>Constructing machine learning model based six distinct groups</title>
<p>We further investigated the efficacy of classifying the progression of HCC across all various stages. To achieve this, we categorized the data into six groups: normal liver, chronic hepatitis, liver cirrhosis, dysplastic nodule, early stage HCC, and advanced HCC. Performance measure of the random forest model was presented in <xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8</bold>
</xref> and <xref ref-type="table" rid="T5">
<bold>Table&#xa0;5</bold>
</xref>, indicating an accuracy of 0.63, precision of 0.63, recall of 0.63, and F1-score of 0.59. Similarly, performance measure of the LightGBM model indicated an accuracy of 0.71, precision of 0.71, recall of 0.71, and F1-score of 0.72.</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>Confusion matrix of the models. <bold>(A)</bold> Confusion matrix of the random forest model. <bold>(B)</bold> Confusion matrix of the LightGBM model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1401496-g008.tif"/>
</fig>
<table-wrap id="T5" position="float">
<label>Table&#xa0;5</label>
<caption>
<p>Performance measure of machine learning models based six distinct groups.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">Model</th>
<th valign="top" align="left">Accuracy</th>
<th valign="top" align="left">Precision</th>
<th valign="top" align="left">Recall</th>
<th valign="top" align="left">F1-score</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Random forest</td>
<td valign="top" align="left">0.63</td>
<td valign="top" align="left">0.63</td>
<td valign="top" align="left">0.63</td>
<td valign="top" align="left">0.59</td>
</tr>
<tr>
<td valign="top" align="left">LightGBM</td>
<td valign="top" align="left">0.71</td>
<td valign="top" align="left">0.71</td>
<td valign="top" align="left">0.71</td>
<td valign="top" align="left">0.72</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>According to the method, the models above comprised a total of 16 characteristic genes (<italic>C1QTNF1</italic>, <italic>JUNB</italic>, <italic>CLEC3B</italic>, <italic>SERPINA11</italic>, <italic>RP11&#x2013;977G19.10</italic>, <italic>CCNB1</italic>, <italic>CDC37L1-AS1</italic>, <italic>CFB</italic>, <italic>RN7SL752P</italic>, <italic>CCL14</italic>, <italic>U3</italic>, <italic>F12</italic>, <italic>ACSL4</italic>, <italic>MOGAT2</italic>, <italic>RN7SKP255</italic>, and <italic>TERC</italic>). Furthermore, we utilized TBtools to generate expression heatmap for these 16 characteristic genes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S3</bold>
</xref>). The characteristic genes are primarily enriched in pathways associated with regulation of plasminogen activation, positive regulation of protein processing, and other pathways (<italic>q</italic> &lt; 0.05; <xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9</bold>
</xref>).</p>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>GO pathway enrichment of characteristic genes.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1401496-g009.tif"/>
</fig>
<p>Regarding these genes, low expression of <italic>CLEC3B</italic>, <italic>CDC37L1-AS1</italic>, <italic>CFB, CCL14</italic>, and <italic>MOGAT2</italic> was associated with poor prognosis, while high expression of <italic>CCNB1</italic> and <italic>ACSL4</italic> was associated with a poor prognosis (<xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10</bold>
</xref>). Furthermore, <italic>CLEC3B</italic>, <italic>CCNB1</italic>, <italic>CCL14</italic>, and <italic>ACSL4</italic> exhibited a strong association with the occurrence of HCC (<xref ref-type="table" rid="T6">
<bold>Table&#xa0;6</bold>
</xref>) (<xref ref-type="bibr" rid="B30">30</xref>, <xref ref-type="bibr" rid="B33">33</xref>&#x2013;<xref ref-type="bibr" rid="B35">35</xref>).</p>
<fig id="f10" position="float">
<label>Figure&#xa0;10</label>
<caption>
<p>Overall survival of HCC genes in GEPIA2 database. <bold>(A)</bold> Overall survival of <italic>CLEC3B.</italic> <bold>(B)</bold> Overall survival of <italic>CCNB1</italic>. <bold>(C)</bold> Overall survival of <italic>CDC37L1-AS1</italic>. <bold>(D)</bold> Overall survival of <italic>CFB</italic>. <bold>(E)</bold> Overall survival of <italic>CCL14.</italic> <bold>(F)</bold> Overall survival of <italic>ACSL4</italic>. <bold>(G)</bold> Overall survival of <italic>MOGAT2</italic>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-14-1401496-g010.tif"/>
</fig>
<table-wrap id="T6" position="float">
<label>Table&#xa0;6</label>
<caption>
<p>
<italic>CLEC3B</italic>, <italic>CCNB1</italic>, <italic>CCL14</italic>, and <italic>ACSL4</italic> reported in HCC from GeneCards database.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">GeneName</th>
<th valign="top" align="left">Location</th>
<th valign="top" align="left">Function summaries</th>
<th valign="top" align="left">Related pathways</th>
<th valign="top" align="left">Report</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">
<italic>CLEC3B</italic>
</td>
<td valign="top" align="left">3p21.31</td>
<td valign="top" align="left">Tetranectin binds to plasminogen and to isolated kringle 4. May be involved in the packaging of molecules destined for exocytosis.</td>
<td valign="top" align="left">Platelet activation, signaling and aggregation.</td>
<td valign="top" align="left">(<xref ref-type="bibr" rid="B30">30</xref>)</td>
</tr>
<tr>
<td valign="top" align="left">
<italic>CCNB1</italic>
</td>
<td valign="top" align="left">5q13.2</td>
<td valign="top" align="left">Essential for the control of the cell cycle at the G2/M (mitosis) transition.</td>
<td valign="top" align="left">1.AMPK signaling pathway.<break/>2. Cell cycle</td>
<td valign="top" align="left">(<xref ref-type="bibr" rid="B33">33</xref>)</td>
</tr>
<tr>
<td valign="top" align="left">
<italic>CCL14</italic>
</td>
<td valign="top" align="left">17q12</td>
<td valign="top" align="left">This gene, chemokine (C-C motif) ligand 14, is one of several CC cytokine genes clustered.</td>
<td valign="top" align="left">1.MIF-mediated glucocorticoid regulation and TGF-Beta Pathway.<break/>2.Chemokine activity.</td>
<td valign="top" align="left">(<xref ref-type="bibr" rid="B34">34</xref>)</td>
</tr>
<tr>
<td valign="top" align="left">
<italic>ACSL4</italic>
</td>
<td valign="top" align="left">Xq23</td>
<td valign="top" align="left">Catalyzes the conversion of long-chain fatty acids to their active form acyl-CoA for both synthesis of cellular lipids.</td>
<td valign="top" align="left">Fatty acid metabolism.</td>
<td valign="top" align="left">(<xref ref-type="bibr" rid="B35">35</xref>)</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<title>Discussion</title>
<p>In this research, we employed machine learning algorithms, specifically random forest and LightGBM, to develop accurate diagnostic models for progression of HCC. After multiple analyses, we have identified potential diagnostic markers for the progression of HCC. Interestingly, when we categorized samples into three groups, the classification accuracy of LightGBM algorithm exceeded 0.95. Also, performance of the random forest model was slightly inferior compared to the LightGBM model. The 12 characteristic genes are primarily involved in complement activation, activation of immune response pathways. Simultaneously, among the characteristic gene <italic>CLEC3B</italic> generated from the model, exosomes derived from HCC with downregulated <italic>CLEC3B</italic> were found to promote the migration, invasion, and epithelial-mesenchymal transition of both tumor cells and endothelial cells (<xref ref-type="bibr" rid="B30">30</xref>). In addition, the <italic>IGFALS</italic>, a tumor suppressor gene, undergoes epigenetic silencing, leading to dysregulation of the IGF-II signaling in HCC (<xref ref-type="bibr" rid="B31">31</xref>). Our research indicated that the <italic>CLEC3B</italic> and <italic>IGFALS</italic> may be involved in the progression from normal liver to precancerous lesions to HCC, but their functions require further investigation.</p>
<p>Furthermore, we explored whether this model can accurately distinguish early stage HCC and assessed the potential benefits of early stage HCC diagnosis. And when the samples were categorized into four groups, the random forest model achieved a classification accuracy exceeding 0.83. Moreover, performance of the LightGBM model was slightly inferior compared to the random forest model. The 12 characteristic genes are primarily enriched in pathway associated with metabolic process. Among the characteristic gene generated from the model, loss of <italic>VIPR1</italic> expression in HCC facilitated CAD phosphorylation and tumor progression, suggesting that the restoration of <italic>VIPR1</italic> and treatment with the <italic>VIPR1</italic> agonist may represent a promising approach for HCC treatment (<xref ref-type="bibr" rid="B32">32</xref>, <xref ref-type="bibr" rid="B36">36</xref>). Our research suggested that <italic>VIPR1</italic> may play a role in the classification of early stage HCC and advanced HCC, but further research is needed to determine its specific function.</p>
<p>Moreover, when categorizing the stages of HCC into six distinct levels, the model still exhibits high diagnostic efficacy. These findings provide a solid foundation for precise treatment. The 16 characteristic genes are primarily enriched in pathway associated with positive regulation of protein processing. Among the characteristic gene generated from the model, <italic>CCNB1</italic> may participate in the cell cycle of HCC by regulating DNA replication, thus promoting the development of HCC (<xref ref-type="bibr" rid="B33">33</xref>). And, <italic>CCL14</italic> was a potential prognostic biomarker for determining HCC progression and was associated with immune cell infiltration in HCC (<xref ref-type="bibr" rid="B34">34</xref>, <xref ref-type="bibr" rid="B37">37</xref>). <italic>ACSL4</italic> promoted the progression of HCC by stabilizing c-Myc through the ERK/FBW7/c-Myc axis (<xref ref-type="bibr" rid="B38">38</xref>). Our research suggested that these genes may be involved in all stages of HCC progression and serve as potential biomarkers. However, further in-depth research is needed.</p>
<p>In the past 20 years, sequencing technologies have continuously advanced, leading to explosive growth in available data. Artificial intelligence is often used for the characterization of sequencing data, which can enhance the ability to detect HCC tumors and provide information for disease diagnosis and staging (<xref ref-type="bibr" rid="B39">39</xref>).</p>
<p>Xie (<xref ref-type="bibr" rid="B40">40</xref>) utilized gene expression profiles from peripheral blood to develop an artificial neural network (ANN) model that could differentiate HCC patients from the control group with a sensitivity of 96% and specificity of 86%. Harpreet (<xref ref-type="bibr" rid="B41">41</xref>) utilized a large-scale transcriptomic analysis dataset containing a total of 2,316 HCC samples and 1,665 non-tumor tissue samples to identify HCC samples using machine learning, with an accuracy ranging from 93% to 98%. Although these studies have demonstrated good predictive performance, they did not further differentiate and study non-tumor tissues (pre-cancerous stages).</p>
<p>In addition, A single-center prospective study in the UK recruited 331 cases of liver cell carcinoma, with a control group involving only 339 patients with chronic liver disease. A logistic regression analysis model was constructed, with an AUROC of 0.97 indicating excellent predictive performance. However, the study was only validated in a cohort of patients with fatty liver disease (<xref ref-type="bibr" rid="B42">42</xref>). Xing (<xref ref-type="bibr" rid="B43">43</xref>) conducted mass spectrometry proteomics sequencing and built a random forest machine learning model that clearly distinguished between HCC and healthy individuals (sensitivity 0.975, specificity 1.000), as well as between HCC and cirrhosis (sensitivity 0.925, specificity 0.915). However, these studies did not cover all stages of liver cancer progression.</p>
<p>In our study, we comprehensively cover all stages of liver cancer development, including normal liver, chronic hepatitis, liver cirrhosis, dysplastic nodule, early stage HCC, and advanced HCC. Furthermore, we conducted detailed classifications into three categories, four categories, and six categories respectively, in order to systematically study relevant models of liver cancer progression. When we categorized three groups: normal liver, precancerous lesion (including chronic hepatitis, liver cirrhosis, dysplastic nodule) and HCC (including early stage HCC and advanced HCC), The LightGBM model exhibited outstanding performance (accuracy = 0.96, precision = 0.96, recall = 0.96, F1-score = 0.95). Surprisingly, when the progression of HCC was categorized into the most refined six stages, the diagnostic model still demonstrated high performance (accuracy = 0.71, precision = 0.71, recall = 0.71, F1 score = 0.72). In conclusion, we successfully constructed the most detailed model of HCC progression stages using machine learning methods, providing a theoretical basis for accurate diagnosis of HCC.</p>
<p>In summary, this research represented the pioneering construction of a diagnostic model for HCC progression through the utilization of machine learning methods. The development of liver cancer is a gradual process. Liver cancer patients undergo a process from hepatitis and liver fibrosis to abnormal nodules, ultimately developing into liver cancer. By subdividing into different stages, we can more finely assess the disease progression stage of liver cancer patients and intervene with precision medicine. We hope that targeted early intervention and treatment can prevent the progression of HCC to advanced stage in the future. Additionally, we have identified key genes associated with the progression of liver cancer. Further research on these genes will facilitate the development of effective targets for liver cancer progression. It is important to note that the HCC progression characteristic genes identified in our research still lack sufficient research concerning their impact on progression of HCC, and further exploration is warranted. Of course, it is crucial to validate effectiveness of the model using a larger sample size. Due to the reduced cost of transcriptome sequencing, increasing dataset will arise in the future. In a word, this research holds potential for clinical application due to its significance and prospect.</p>
</sec>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. Further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s6" sec-type="author-contributions">
<title>Author contributions</title>
<p>XJ: Data curation, Formal analysis, Writing &#x2013; original draft,&#xa0;Writing &#x2013; review &amp; editing. RZ: Data curation, Formal&#xa0;analysis,&#xa0;Software, Writing &#x2013; original draft. FJ: Data curation,&#xa0;Investigation, Writing &#x2013; review &amp; editing. YY: Conceptualization,&#xa0;Investigation,&#xa0;Writing &#x2013; review &amp; editing. ZZ: Conceptualization,&#xa0;Supervision, Writing &#x2013; original draft. JW:&#xa0;Conceptualization,&#xa0;Funding acquisition, Investigation, Writing &#x2013; review &amp; editing, Writing &#x2013; original draft.</p>
</sec>
</body>
<back>
<sec id="s7" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article. The authors gratefully acknowledge the financial support of the Science Foundation of the Excellent Youth Scholars of Fujian Provincial Health Commission (Grant 2021ZQNZD009), Natural Science Foundation of Fujian Province (Grant 2021J01445).</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>The authors are grateful for the open source data from GEO.</p>
</ack>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s9" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fonc.2024.1401496/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fonc.2024.1401496/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet_1.pdf" id="SM1" mimetype="application/pdf"/>
<supplementary-material xlink:href="DataSheet_2.pdf" id="SM2" mimetype="application/pdf"/>
<supplementary-material xlink:href="DataSheet_3.pdf" id="SM3" mimetype="application/pdf"/>
<supplementary-material xlink:href="Table_1.xlsx" id="ST1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_2.xlsx" id="ST2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_3.xlsx" id="ST3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sung</surname> <given-names>H</given-names>
</name>
<name>
<surname>Ferlay</surname> <given-names>J</given-names>
</name>
<name>
<surname>Siegel</surname> <given-names>RL</given-names>
</name>
<name>
<surname>Laversanne</surname> <given-names>M</given-names>
</name>
<name>
<surname>Soerjomataram</surname> <given-names>I</given-names>
</name>
<name>
<surname>Jemal</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Global cancer statistics 2020: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title>. <source>CA Cancer J Clin</source>. (<year>2021</year>) <volume>71</volume>:<page-range>209&#x2013;49</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3322/caac.21660</pub-id>
</citation>
</ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bruix</surname> <given-names>J</given-names>
</name>
<name>
<surname>Reig</surname> <given-names>M</given-names>
</name>
<name>
<surname>Sherman</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Evidence-based diagnosis, staging, and treatment of patients with hepatocellular carcinoma</article-title>. <source>Gastroenterology</source>. (<year>2016</year>) <volume>150</volume>:<page-range>835&#x2013;53</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1053/j.gastro.2015.12.041</pub-id>
</citation>
</ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>L</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>H</given-names>
</name>
</person-group>. <article-title>Heterogeneity of liver cancer and personalized therapy</article-title>. <source>Cancer Lett</source>. (<year>2016</year>) <volume>379</volume>:<page-range>191&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.canlet.2015.07.018</pub-id>
</citation>
</ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chan</surname> <given-names>LK</given-names>
</name>
<name>
<surname>Tsui</surname> <given-names>YM</given-names>
</name>
<name>
<surname>Ho</surname> <given-names>DW</given-names>
</name>
<name>
<surname>Ng</surname> <given-names>IO</given-names>
</name>
</person-group>. <article-title>Cellular heterogeneity and plasticity in liver cancer</article-title>. <source>Semin Cancer Biol</source>. (<year>2022</year>) <volume>82</volume>:<page-range>134&#x2013;49</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.semcancer.2021.02.015</pub-id>
</citation>
</ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Villanueva</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Hepatocellular carcinoma</article-title>. <source>N Engl J Med</source>. (<year>2019</year>) <volume>380</volume>:<page-range>1450&#x2013;62</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1056/NEJMra1713263</pub-id>
</citation>
</ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Swanson</surname> <given-names>K</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>E</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>A</given-names>
</name>
<name>
<surname>Alizadeh</surname> <given-names>AA</given-names>
</name>
<name>
<surname>Zou</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>From patterns to patients: Advances in clinical machine learning for cancer diagnosis, prognosis, and treatment</article-title>. <source>Cell</source>. (<year>2023</year>) <volume>186</volume>:<page-range>1772&#x2013;91</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cell.2023.01.035</pub-id>
</citation>
</ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kann</surname> <given-names>BH</given-names>
</name>
<name>
<surname>Hosny</surname> <given-names>A</given-names>
</name>
<name>
<surname>Aerts</surname> <given-names>H</given-names>
</name>
</person-group>. <article-title>Artificial intelligence for clinical oncology</article-title>. <source>Cancer Cell</source>. (<year>2021</year>) <volume>39</volume>:<page-range>916&#x2013;27</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ccell.2021.04.002</pub-id>
</citation>
</ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>W</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>R</given-names>
</name>
<name>
<surname>Bao</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>Ultrasensitive and affordable assay for early detection of primary liver cancer using plasma cell-free DNA fragmentomics</article-title>. <source>Hepatology</source>. (<year>2022</year>) <volume>76</volume>:<page-range>317&#x2013;29</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/hep.32308</pub-id>
</citation>
</ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tang</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>F</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>C</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X</given-names>
</name>
<name>
<surname>Yin</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Diagnosis of hepatocellular carcinoma based on salivary protein glycopatterns and machine learning algorithms</article-title>. <source>Clin Chem Lab Med</source>. (<year>2022</year>) <volume>60</volume>:<page-range>1963&#x2013;73</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1515/cclm-2022&#x2013;0715</pub-id>
</citation>
</ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>X</given-names>
</name>
<name>
<surname>Ishwaran</surname> <given-names>H</given-names>
</name>
</person-group>. <article-title>Random forests for genomic data analysis</article-title>. <source>Genomics</source>. (<year>2012</year>) <volume>99</volume>:<page-range>323&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ygeno.2012.04.003</pub-id>
</citation>
</ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sheehy</surname> <given-names>J</given-names>
</name>
<name>
<surname>Rutledge</surname> <given-names>H</given-names>
</name>
<name>
<surname>Acharya</surname> <given-names>UR</given-names>
</name>
<name>
<surname>Loh</surname> <given-names>HW</given-names>
</name>
<name>
<surname>Gururajan</surname> <given-names>R</given-names>
</name>
<name>
<surname>Tao</surname> <given-names>X</given-names>
</name>
<etal/>
</person-group>. <article-title>Gynecological cancer prognosis using machine learning techniques: A systematic review of the last three decades (1990&#x2013;2022)</article-title>. <source>Artif Intell Med</source>. (<year>2023</year>) <volume>139</volume>:<elocation-id>102536</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.artmed.2023.102536</pub-id>
</citation>
</ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname> <given-names>J</given-names>
</name>
<name>
<surname>Su</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>B</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>W</given-names>
</name>
<etal/>
</person-group>. <article-title>Real-time biomechanical modelling of the liver using LightGBM model</article-title>. <source>Int J Med Robot</source>. (<year>2022</year>) <volume>18</volume>:<elocation-id>e2433</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/rcs.2433</pub-id>
</citation>
</ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hamed</surname> <given-names>EA</given-names>
</name>
<name>
<surname>Salem</surname> <given-names>MA</given-names>
</name>
<name>
<surname>Badr</surname> <given-names>NL</given-names>
</name>
<name>
<surname>Tolba</surname> <given-names>MF</given-names>
</name>
</person-group>. <article-title>An efficient combination of convolutional neural network and lightGBM algorithm for lung cancer histopathology classification</article-title>. <source>Diagnostics (Basel)</source>. (<year>2023</year>) <volume>13</volume>:<elocation-id>2469</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/diagnostics13152469</pub-id>
</citation>
</ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Penson</surname> <given-names>A</given-names>
</name>
<name>
<surname>Camacho</surname> <given-names>N</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Varghese</surname> <given-names>AM</given-names>
</name>
<name>
<surname>Al-Ahmadie</surname> <given-names>H</given-names>
</name>
<name>
<surname>Razavi</surname> <given-names>P</given-names>
</name>
<etal/>
</person-group>. <article-title>Development of genome-derived tumor type prediction to inform clinical cancer care</article-title>. <source>JAMA Oncol</source>. (<year>2020</year>) <volume>6</volume>:<fpage>84</fpage>&#x2013;<lpage>91</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1001/jamaoncol.2019.3985</pub-id>
</citation>
</ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Eun</surname> <given-names>JW</given-names>
</name>
<name>
<surname>Jang</surname> <given-names>JW</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>HD</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>J</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>SY</given-names>
</name>
<name>
<surname>Na</surname> <given-names>MJ</given-names>
</name>
<etal/>
</person-group>. <article-title>Serum proteins, HMMR, NXPH4, PITX1 and THBS4; A panel of biomarkers for early diagnosis of hepatocellular carcinoma</article-title>. <source>J Clin Med</source>. (<year>2022</year>) <volume>11</volume>:<elocation-id>2128</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/jcm11082128</pub-id>
</citation>
</ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>X</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>R</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>D</given-names>
</name>
<etal/>
</person-group>. <article-title>Survival prediction by Bayesian network modeling for pseudomyxoma peritonei after cytoreductive surgery plus hyperthermic intraperitoneal chemotherapy</article-title>. <source>Cancer Med</source>. (<year>2023</year>) <volume>12</volume>:<page-range>2637&#x2013;45</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/cam4.5138</pub-id>
</citation>
</ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>D</given-names>
</name>
<name>
<surname>Kuang</surname> <given-names>L</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>W</given-names>
</name>
<etal/>
</person-group>. <article-title>Development of an interpretable machine learning model associated with heavy metals&#x2019; exposure to identify coronary heart disease among US adults via SHAP: Findings of the US NHANES from 2003 to 2018</article-title>. <source>Chemosphere</source>. (<year>2023</year>) <volume>311</volume>:<elocation-id>137039</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.chemosphere.2022.137039</pub-id>
</citation>
</ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>XZ</given-names>
</name>
<name>
<surname>Duan</surname> <given-names>M</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>HD</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Xiang</surname> <given-names>TY</given-names>
</name>
<name>
<surname>Niu</surname> <given-names>WC</given-names>
</name>
<etal/>
</person-group>. <article-title>Predicting diabetic kidney disease for type 2 diabetes mellitus by machine learning in the real world: a multicenter retrospective study</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2023</year>) <volume>14</volume>:<elocation-id>1184190</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fendo.2023.1184190</pub-id>
</citation>
</ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wolf</surname> <given-names>FA</given-names>
</name>
<name>
<surname>Angerer</surname> <given-names>P</given-names>
</name>
<name>
<surname>Theis</surname> <given-names>FJ</given-names>
</name>
</person-group>. <article-title>SCANPY: large-scale single-cell gene expression data analysis</article-title>. <source>Genome Biol</source>. (<year>2018</year>) <volume>19</volume>:<fpage>15</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13059&#x2013;017-1382&#x2013;0</pub-id>
</citation>
</ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname> <given-names>RH</given-names>
</name>
<name>
<surname>Wei</surname> <given-names>W</given-names>
</name>
<name>
<surname>Krawczyk</surname> <given-names>M</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>W</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>H</given-names>
</name>
<name>
<surname>Flagg</surname> <given-names>K</given-names>
</name>
<etal/>
</person-group>. <article-title>Circulating tumour DNA methylation markers for diagnosis and prognosis of hepatocellular carcinoma</article-title>. <source>Nat Mater</source>. (<year>2017</year>) <volume>16</volume>:<page-range>1155&#x2013;61</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nmat4997</pub-id>
</citation>
</ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Eraslan</surname> <given-names>G</given-names>
</name>
<name>
<surname>Simon</surname> <given-names>LM</given-names>
</name>
<name>
<surname>Mircea</surname> <given-names>M</given-names>
</name>
<name>
<surname>Mueller</surname> <given-names>NS</given-names>
</name>
<name>
<surname>Theis</surname> <given-names>FJ</given-names>
</name>
</person-group>. <article-title>Single-cell RNA-seq denoising using a deep count autoencoder</article-title>. <source>Nat Commun</source>. (<year>2019</year>) <volume>10</volume>:<fpage>390</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467&#x2013;018-07931&#x2013;2</pub-id>
</citation>
</ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Su</surname> <given-names>C</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Shan</surname> <given-names>X</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>B</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>H</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Cell-type-specific co-expression inference from single cell RNA-sequencing data</article-title>. <source>Nat Commun</source>. (<year>2023</year>) <volume>14</volume>:<fpage>4846</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467&#x2013;023-40503&#x2013;7</pub-id>
</citation>
</ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peng</surname> <given-names>HY</given-names>
</name>
<name>
<surname>Duan</surname> <given-names>SJ</given-names>
</name>
<name>
<surname>Pan</surname> <given-names>L</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>MY</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>JL</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>YC</given-names>
</name>
<etal/>
</person-group>. <article-title>Development and validation of machine learning models for nonalcoholic fatty liver disease</article-title>. <source>Hepatobiliary Pancreat Dis Int</source>. (<year>2023</year>) <volume>22</volume>:<page-range>615&#x2013;21</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.hbpd.2023.03.009</pub-id>
</citation>
</ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lotfollahi</surname> <given-names>M</given-names>
</name>
<name>
<surname>Rybakov</surname> <given-names>S</given-names>
</name>
<name>
<surname>Hrovatin</surname> <given-names>K</given-names>
</name>
<name>
<surname>Hediyeh-Zadeh</surname> <given-names>S</given-names>
</name>
<name>
<surname>Talavera-L&#xf3;pez</surname> <given-names>C</given-names>
</name>
<name>
<surname>Misharin</surname> <given-names>AV</given-names>
</name>
<etal/>
</person-group>. <article-title>Biologically informed deep learning to query gene programs in single-cell atlases</article-title>. <source>Nat Cell Biol</source>. (<year>2023</year>) <volume>25</volume>:<page-range>337&#x2013;50</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41556-022-01072-x</pub-id>
</citation>
</ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>C</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>H</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Thomas</surname> <given-names>HR</given-names>
</name>
<name>
<surname>Frank</surname> <given-names>MH</given-names>
</name>
<name>
<surname>He</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>TBtools: an integrative toolkit developed for interactive analyses of big biological data</article-title>. <source>Mol Plant</source>. (<year>2020</year>) <volume>13</volume>:<page-range>1194&#x2013;202</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.molp.2020.06.009</pub-id>
</citation>
</ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>C</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zeng</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>TBtools-II: A &#x201c;one for all, all for one&#x201d; bioinformatics platform for biological big-data mining</article-title>. <source>Mol Plant</source>. (<year>2023</year>) <volume>16</volume>:<page-range>1733&#x2013;42</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.molp.2023.09.010</pub-id>
</citation>
</ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tang</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Kang</surname> <given-names>B</given-names>
</name>
<name>
<surname>Li</surname> <given-names>C</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>T</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Z</given-names>
</name>
</person-group>. <article-title>GEPIA2: an enhanced web server for large-scale expression profiling and interactive analysis</article-title>. <source>Nucleic Acids Res</source>. (<year>2019</year>) <volume>47</volume>:<page-range>W556&#x2013;W60</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkz430</pub-id>
</citation>
</ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>T</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>E</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>M</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>P</given-names>
</name>
<name>
<surname>Dai</surname> <given-names>Z</given-names>
</name>
<etal/>
</person-group>. <article-title>clusterProfiler 4.0: A universal enrichment tool for interpreting omics data</article-title>. <source>Innovation (Camb)</source>. (<year>2021</year>) <volume>2</volume>:<fpage>100141</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.xinn.2021.100141</pub-id>
</citation>
</ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname> <given-names>D</given-names>
</name>
<name>
<surname>Fang</surname> <given-names>M</given-names>
</name>
<name>
<surname>Shao</surname> <given-names>L</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>The EMT-related genes GALNT3 and OAS1 are associated with immune cell infiltration and poor prognosis in lung adenocarcinoma</article-title>. <source>Front Biosci (Landmark Ed)</source>. (<year>2023</year>) <volume>28</volume>:<elocation-id>271</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.31083/j.fbl2810271</pub-id>
</citation>
</ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dai</surname> <given-names>W</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>T</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>W</given-names>
</name>
<name>
<surname>Gu</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Downregulation of exosomal CLEC3B in hepatocellular carcinoma promotes metastasis and angiogenesis via AMPK and VEGF signals</article-title>. <source>Cell Commun Signal</source>. (<year>2019</year>) <volume>17</volume>:<fpage>113</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12964&#x2013;019-0423&#x2013;6</pub-id>
</citation>
</ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Neumann</surname> <given-names>O</given-names>
</name>
<name>
<surname>Kesselmeier</surname> <given-names>M</given-names>
</name>
<name>
<surname>Geffers</surname> <given-names>R</given-names>
</name>
<name>
<surname>Pellegrino</surname> <given-names>R</given-names>
</name>
<name>
<surname>Radlwimmer</surname> <given-names>B</given-names>
</name>
<name>
<surname>Hoffmann</surname> <given-names>K</given-names>
</name>
<etal/>
</person-group>. <article-title>Methylome analysis and integrative profiling of human HCCs identify novel protumorigenic factors</article-title>. <source>Hepatology</source>. (<year>2012</year>) <volume>56</volume>:<page-range>1817&#x2013;27</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/hep.25870</pub-id>
</citation>
</ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Rodrigues</surname> <given-names>RM</given-names>
</name>
<name>
<surname>Han</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>C</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>Z</given-names>
</name>
<etal/>
</person-group>. <article-title>Activation of VIPR1 suppresses hepatocellular carcinoma progression by regulating arginine and pyrimidine metabolism</article-title>. <source>Int J Biol Sci</source>. (<year>2022</year>) <volume>18</volume>:<page-range>4341&#x2013;56</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.7150/ijbs.71134</pub-id>
</citation>
</ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rong</surname> <given-names>MH</given-names>
</name>
<name>
<surname>Li</surname> <given-names>JD</given-names>
</name>
<name>
<surname>Zhong</surname> <given-names>LY</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>YZ</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>J</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>LY</given-names>
</name>
<etal/>
</person-group>. <article-title>CCNB1 promotes the development of hepatocellular carcinoma by mediating DNA replication in the cell cycle</article-title>. <source>Exp Biol Med (Maywood)</source>. (<year>2022</year>) <volume>247</volume>:<fpage>395</fpage>&#x2013;<lpage>408</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/15353702211049149</pub-id>
</citation>
</ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X</given-names>
</name>
<name>
<surname>Bi</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X</given-names>
</name>
<etal/>
</person-group>. <article-title>CCL14 is a prognostic biomarker and correlates with immune infiltrates in hepatocellular carcinoma</article-title>. <source>Aging (Albany NY)</source>. (<year>2020</year>) <volume>12</volume>:<fpage>784</fpage>&#x2013;<lpage>807</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.18632/aging.102656</pub-id>
</citation>
</ref>
<ref id="B35">
<label>35</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>J</given-names>
</name>
<name>
<surname>Ding</surname> <given-names>C</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>W</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>W</given-names>
</name>
<etal/>
</person-group>. <article-title>ACSL4 promotes hepatocellular carcinoma progression via c-Myc stability mediated by ERK/FBW7/c-Myc axis</article-title>. <source>Oncogenesis</source>. (<year>2020</year>) <volume>9</volume>:<fpage>42</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41389-020-0226-z</pub-id>
</citation>
</ref>
<ref id="B36">
<label>36</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname> <given-names>XH</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>DY</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>ZY</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>WQ</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>RX</given-names>
</name>
<name>
<surname>Li</surname> <given-names>DP</given-names>
</name>
<etal/>
</person-group>. <article-title>lncRNA-AC079061.1/VIPR1 axis may suppress the development of hepatocellular carcinoma: a bioinformatics analysis and experimental validation</article-title>. <source>J Transl Med</source>. (<year>2022</year>) <volume>20</volume>:<fpage>379</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12967&#x2013;022-03573&#x2013;7</pub-id>
</citation>
</ref>
<ref id="B37">
<label>37</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname> <given-names>M</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>W</given-names>
</name>
<name>
<surname>Wei</surname> <given-names>C</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>CCL14 serves as a novel prognostic factor and tumor suppressor of HCC by modulating cell cycle and promoting apoptosis</article-title>. <source>Cell Death Dis</source>. (<year>2019</year>) <volume>10</volume>:<fpage>796</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41419&#x2013;019-1966&#x2013;6</pub-id>
</citation>
</ref>
<ref id="B38">
<label>38</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>J</given-names>
</name>
<name>
<surname>Ding</surname> <given-names>C</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>W</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>C</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>C</given-names>
</name>
<etal/>
</person-group>. <article-title>ACSL4 reprograms fatty acid metabolism in hepatocellular carcinoma via c-Myc/SREBP1 pathway</article-title>. <source>Cancer Lett</source>. (<year>2021</year>) <volume>502</volume>:<page-range>154&#x2013;65</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.canlet.2020.12.019</pub-id>
</citation>
</ref>
<ref id="B39">
<label>39</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Calderaro</surname> <given-names>J</given-names>
</name>
<name>
<surname>Seraphin</surname> <given-names>TP</given-names>
</name>
<name>
<surname>Luedde</surname> <given-names>T</given-names>
</name>
<name>
<surname>Simon</surname> <given-names>TG</given-names>
</name>
</person-group>. <article-title>Artificial intelligence for the prevention and clinical management of hepatocellular carcinoma</article-title>. <source>J Hepatol</source>. (<year>2022</year>) <volume>76</volume>:<page-range>1348&#x2013;61</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jhep.2022.01.014</pub-id>
</citation>
</ref>
<ref id="B40">
<label>40</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xie</surname> <given-names>H</given-names>
</name>
<name>
<surname>Xue</surname> <given-names>YQ</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>P</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>PJ</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>ST</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Z</given-names>
</name>
<etal/>
</person-group>. <article-title>Multi-parameter gene expression profiling of peripheral blood for early detection of hepatocellular carcinoma</article-title>. <source>World J Gastroenterol</source>. (<year>2018</year>) <volume>24</volume>:<page-range>371&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3748/wjg.v24.i3.371</pub-id>
</citation>
</ref>
<ref id="B41">
<label>41</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kaur</surname> <given-names>H</given-names>
</name>
<name>
<surname>Dhall</surname> <given-names>A</given-names>
</name>
<name>
<surname>Kumar</surname> <given-names>R</given-names>
</name>
<name>
<surname>Raghava</surname> <given-names>GPS</given-names>
</name>
</person-group>. <article-title>Identification of platform-independent diagnostic biomarker panel for hepatocellular carcinoma using large-scale transcriptomics data</article-title>. <source>Front Genet</source>. (<year>2020</year>) <volume>10</volume>:<elocation-id>1306</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fgene.2019.01306</pub-id>
</citation>
</ref>
<ref id="B42">
<label>42</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Johnson</surname> <given-names>PJ</given-names>
</name>
<name>
<surname>Pirrie</surname> <given-names>SJ</given-names>
</name>
<name>
<surname>Cox</surname> <given-names>TF</given-names>
</name>
<name>
<surname>Berhane</surname> <given-names>S</given-names>
</name>
<name>
<surname>Teng</surname> <given-names>M</given-names>
</name>
<name>
<surname>Palmer</surname> <given-names>D</given-names>
</name>
<etal/>
</person-group>. <article-title>The detection of hepatocellular carcinoma using a prospectively developed and validated model based on serological biomarkers</article-title>. <source>Cancer Epidemiol Biomarkers Prev</source>. (<year>2014</year>) <volume>23</volume>:<page-range>144&#x2013;53</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1158/1055&#x2013;9965.EPI-13&#x2013;0870</pub-id>
</citation>
</ref>
<ref id="B43">
<label>43</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xing</surname> <given-names>X</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>L</given-names>
</name>
<name>
<surname>Ouyang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>F</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Proteomics-driven noninvasive screening of circulating serum protein panels for the early diagnosis of hepatocellular carcinoma</article-title>. <source>Nat Commun</source>. (<year>2023</year>) <volume>14</volume>:<fpage>8392</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467&#x2013;023-44255&#x2013;2</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>